| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359 |
- package tools
- import (
- "bufio"
- "context"
- "encoding/json"
- "fmt"
- "os"
- "os/exec"
- "path/filepath"
- "regexp"
- "sort"
- "strconv"
- "strings"
- "time"
- "github.com/sst/opencode/internal/config"
- "github.com/sst/opencode/internal/fileutil"
- )
- type GrepParams struct {
- Pattern string `json:"pattern"`
- Path string `json:"path"`
- Include string `json:"include"`
- LiteralText bool `json:"literal_text"`
- }
- type grepMatch struct {
- path string
- modTime time.Time
- lineNum int
- lineText string
- }
- type GrepResponseMetadata struct {
- NumberOfMatches int `json:"number_of_matches"`
- Truncated bool `json:"truncated"`
- }
- type grepTool struct{}
- const (
- GrepToolName = "grep"
- grepDescription = `Fast content search tool that finds files containing specific text or patterns, returning matching file paths sorted by modification time (newest first).
- WHEN TO USE THIS TOOL:
- - Use when you need to find files containing specific text or patterns
- - Great for searching code bases for function names, variable declarations, or error messages
- - Useful for finding all files that use a particular API or pattern
- HOW TO USE:
- - Provide a regex pattern to search for within file contents
- - Set literal_text=true if you want to search for the exact text with special characters (recommended for non-regex users)
- - Optionally specify a starting directory (defaults to current working directory)
- - Optionally provide an include pattern to filter which files to search
- - Results are sorted with most recently modified files first
- REGEX PATTERN SYNTAX (when literal_text=false):
- - Supports standard regular expression syntax
- - 'function' searches for the literal text "function"
- - 'log\..*Error' finds text starting with "log." and ending with "Error"
- - 'import\s+.*\s+from' finds import statements in JavaScript/TypeScript
- COMMON INCLUDE PATTERN EXAMPLES:
- - '*.js' - Only search JavaScript files
- - '*.{ts,tsx}' - Only search TypeScript files
- - '*.go' - Only search Go files
- LIMITATIONS:
- - Results are limited to 100 files (newest first)
- - Performance depends on the number of files being searched
- - Very large binary files may be skipped
- - Hidden files (starting with '.') are skipped
- TIPS:
- - For faster, more targeted searches, first use Glob to find relevant files, then use Grep
- - When doing iterative exploration that may require multiple rounds of searching, consider using the Agent tool instead
- - Always check if results are truncated and refine your search pattern if needed
- - Use literal_text=true when searching for exact text containing special characters like dots, parentheses, etc.`
- )
- func NewGrepTool() BaseTool {
- return &grepTool{}
- }
- func (g *grepTool) Info() ToolInfo {
- return ToolInfo{
- Name: GrepToolName,
- Description: grepDescription,
- Parameters: map[string]any{
- "pattern": map[string]any{
- "type": "string",
- "description": "The regex pattern to search for in file contents",
- },
- "path": map[string]any{
- "type": "string",
- "description": "The directory to search in. Defaults to the current working directory.",
- },
- "include": map[string]any{
- "type": "string",
- "description": "File pattern to include in the search (e.g. \"*.js\", \"*.{ts,tsx}\")",
- },
- "literal_text": map[string]any{
- "type": "boolean",
- "description": "If true, the pattern will be treated as literal text with special regex characters escaped. Default is false.",
- },
- },
- Required: []string{"pattern"},
- }
- }
- // escapeRegexPattern escapes special regex characters so they're treated as literal characters
- func escapeRegexPattern(pattern string) string {
- specialChars := []string{"\\", ".", "+", "*", "?", "(", ")", "[", "]", "{", "}", "^", "$", "|"}
- escaped := pattern
- for _, char := range specialChars {
- escaped = strings.ReplaceAll(escaped, char, "\\"+char)
- }
- return escaped
- }
- func (g *grepTool) Run(ctx context.Context, call ToolCall) (ToolResponse, error) {
- var params GrepParams
- if err := json.Unmarshal([]byte(call.Input), ¶ms); err != nil {
- return NewTextErrorResponse(fmt.Sprintf("error parsing parameters: %s", err)), nil
- }
- if params.Pattern == "" {
- return NewTextErrorResponse("pattern is required"), nil
- }
- // If literal_text is true, escape the pattern
- searchPattern := params.Pattern
- if params.LiteralText {
- searchPattern = escapeRegexPattern(params.Pattern)
- }
- searchPath := params.Path
- if searchPath == "" {
- searchPath = config.WorkingDirectory()
- }
- matches, truncated, err := searchFiles(searchPattern, searchPath, params.Include, 100)
- if err != nil {
- return ToolResponse{}, fmt.Errorf("error searching files: %w", err)
- }
- var output string
- if len(matches) == 0 {
- output = "No files found"
- } else {
- output = fmt.Sprintf("Found %d matches\n", len(matches))
- currentFile := ""
- for _, match := range matches {
- if currentFile != match.path {
- if currentFile != "" {
- output += "\n"
- }
- currentFile = match.path
- output += fmt.Sprintf("%s:\n", match.path)
- }
- if match.lineNum > 0 {
- output += fmt.Sprintf(" Line %d: %s\n", match.lineNum, match.lineText)
- } else {
- output += fmt.Sprintf(" %s\n", match.path)
- }
- }
- if truncated {
- output += "\n(Results are truncated. Consider using a more specific path or pattern.)"
- }
- }
- return WithResponseMetadata(
- NewTextResponse(output),
- GrepResponseMetadata{
- NumberOfMatches: len(matches),
- Truncated: truncated,
- },
- ), nil
- }
- func searchFiles(pattern, rootPath, include string, limit int) ([]grepMatch, bool, error) {
- matches, err := searchWithRipgrep(pattern, rootPath, include)
- if err != nil {
- matches, err = searchFilesWithRegex(pattern, rootPath, include)
- if err != nil {
- return nil, false, err
- }
- }
- sort.Slice(matches, func(i, j int) bool {
- return matches[i].modTime.After(matches[j].modTime)
- })
- truncated := len(matches) > limit
- if truncated {
- matches = matches[:limit]
- }
- return matches, truncated, nil
- }
- func searchWithRipgrep(pattern, path, include string) ([]grepMatch, error) {
- _, err := exec.LookPath("rg")
- if err != nil {
- return nil, fmt.Errorf("ripgrep not found: %w", err)
- }
- // Use -n to show line numbers and include the matched line
- args := []string{"-n", pattern}
- if include != "" {
- args = append(args, "--glob", include)
- }
- args = append(args, path)
- cmd := exec.Command("rg", args...)
- output, err := cmd.Output()
- if err != nil {
- if exitErr, ok := err.(*exec.ExitError); ok && exitErr.ExitCode() == 1 {
- return []grepMatch{}, nil
- }
- return nil, err
- }
- lines := strings.Split(strings.TrimSpace(string(output)), "\n")
- matches := make([]grepMatch, 0, len(lines))
- for _, line := range lines {
- if line == "" {
- continue
- }
- // Parse ripgrep output format: file:line:content
- parts := strings.SplitN(line, ":", 3)
- if len(parts) < 3 {
- continue
- }
- filePath := parts[0]
- lineNum, err := strconv.Atoi(parts[1])
- if err != nil {
- continue
- }
- lineText := parts[2]
- fileInfo, err := os.Stat(filePath)
- if err != nil {
- continue // Skip files we can't access
- }
- matches = append(matches, grepMatch{
- path: filePath,
- modTime: fileInfo.ModTime(),
- lineNum: lineNum,
- lineText: lineText,
- })
- }
- return matches, nil
- }
- func searchFilesWithRegex(pattern, rootPath, include string) ([]grepMatch, error) {
- matches := []grepMatch{}
- regex, err := regexp.Compile(pattern)
- if err != nil {
- return nil, fmt.Errorf("invalid regex pattern: %w", err)
- }
- var includePattern *regexp.Regexp
- if include != "" {
- regexPattern := globToRegex(include)
- includePattern, err = regexp.Compile(regexPattern)
- if err != nil {
- return nil, fmt.Errorf("invalid include pattern: %w", err)
- }
- }
- err = filepath.Walk(rootPath, func(path string, info os.FileInfo, err error) error {
- if err != nil {
- return nil // Skip errors
- }
- if info.IsDir() {
- return nil // Skip directories
- }
- if fileutil.SkipHidden(path) {
- return nil
- }
- if includePattern != nil && !includePattern.MatchString(path) {
- return nil
- }
- match, lineNum, lineText, err := fileContainsPattern(path, regex)
- if err != nil {
- return nil // Skip files we can't read
- }
- if match {
- matches = append(matches, grepMatch{
- path: path,
- modTime: info.ModTime(),
- lineNum: lineNum,
- lineText: lineText,
- })
- if len(matches) >= 200 {
- return filepath.SkipAll
- }
- }
- return nil
- })
- if err != nil {
- return nil, err
- }
- return matches, nil
- }
- func fileContainsPattern(filePath string, pattern *regexp.Regexp) (bool, int, string, error) {
- file, err := os.Open(filePath)
- if err != nil {
- return false, 0, "", err
- }
- defer file.Close()
- scanner := bufio.NewScanner(file)
- lineNum := 0
- for scanner.Scan() {
- lineNum++
- line := scanner.Text()
- if pattern.MatchString(line) {
- return true, lineNum, line, nil
- }
- }
- return false, 0, "", scanner.Err()
- }
- func globToRegex(glob string) string {
- regexPattern := strings.ReplaceAll(glob, ".", "\\.")
- regexPattern = strings.ReplaceAll(regexPattern, "*", ".*")
- regexPattern = strings.ReplaceAll(regexPattern, "?", ".")
- re := regexp.MustCompile(`\{([^}]+)\}`)
- regexPattern = re.ReplaceAllStringFunc(regexPattern, func(match string) string {
- inner := match[1 : len(match)-1]
- return "(" + strings.ReplaceAll(inner, ",", "|") + ")"
- })
- return regexPattern
- }
|