| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421 |
- package tools
- import (
- "os"
- "path/filepath"
- "regexp"
- "testing"
- "github.com/stretchr/testify/require"
- )
- func TestRegexCache(t *testing.T) {
- cache := newRegexCache()
- // Test basic caching
- pattern := "test.*pattern"
- regex1, err := cache.get(pattern)
- if err != nil {
- t.Fatalf("Failed to compile regex: %v", err)
- }
- regex2, err := cache.get(pattern)
- if err != nil {
- t.Fatalf("Failed to get cached regex: %v", err)
- }
- // Should be the same instance (cached)
- if regex1 != regex2 {
- t.Error("Expected cached regex to be the same instance")
- }
- // Test that it actually works
- if !regex1.MatchString("test123pattern") {
- t.Error("Regex should match test string")
- }
- }
- func TestGlobToRegexCaching(t *testing.T) {
- // Test that globToRegex uses pre-compiled regex
- pattern1 := globToRegex("*.{js,ts}")
- // Should not panic and should work correctly
- regex1, err := regexp.Compile(pattern1)
- if err != nil {
- t.Fatalf("Failed to compile glob regex: %v", err)
- }
- if !regex1.MatchString("test.js") {
- t.Error("Glob regex should match .js files")
- }
- if !regex1.MatchString("test.ts") {
- t.Error("Glob regex should match .ts files")
- }
- if regex1.MatchString("test.go") {
- t.Error("Glob regex should not match .go files")
- }
- }
- func TestGrepWithIgnoreFiles(t *testing.T) {
- t.Parallel()
- tempDir := t.TempDir()
- // Create test files
- testFiles := map[string]string{
- "file1.txt": "hello world",
- "file2.txt": "hello world",
- "ignored/file3.txt": "hello world",
- "node_modules/lib.js": "hello world",
- "secret.key": "hello world",
- }
- for path, content := range testFiles {
- fullPath := filepath.Join(tempDir, path)
- require.NoError(t, os.MkdirAll(filepath.Dir(fullPath), 0o755))
- require.NoError(t, os.WriteFile(fullPath, []byte(content), 0o644))
- }
- // Create .gitignore file
- gitignoreContent := "ignored/\n*.key\n"
- require.NoError(t, os.WriteFile(filepath.Join(tempDir, ".gitignore"), []byte(gitignoreContent), 0o644))
- // Create .crushignore file
- crushignoreContent := "node_modules/\n"
- require.NoError(t, os.WriteFile(filepath.Join(tempDir, ".crushignore"), []byte(crushignoreContent), 0o644))
- // Test both implementations
- for name, fn := range map[string]func(pattern, path, include string) ([]grepMatch, error){
- "regex": searchFilesWithRegex,
- "rg": func(pattern, path, include string) ([]grepMatch, error) {
- return searchWithRipgrep(t.Context(), pattern, path, include)
- },
- } {
- t.Run(name, func(t *testing.T) {
- t.Parallel()
- if name == "rg" && getRg() == "" {
- t.Skip("rg is not in $PATH")
- }
- matches, err := fn("hello world", tempDir, "")
- require.NoError(t, err)
- // Convert matches to a set of file paths for easier testing
- foundFiles := make(map[string]bool)
- for _, match := range matches {
- foundFiles[filepath.Base(match.path)] = true
- }
- // Should find file1.txt and file2.txt
- require.True(t, foundFiles["file1.txt"], "Should find file1.txt")
- require.True(t, foundFiles["file2.txt"], "Should find file2.txt")
- // Should NOT find ignored files
- require.False(t, foundFiles["file3.txt"], "Should not find file3.txt (ignored by .gitignore)")
- require.False(t, foundFiles["lib.js"], "Should not find lib.js (ignored by .crushignore)")
- require.False(t, foundFiles["secret.key"], "Should not find secret.key (ignored by .gitignore)")
- // Should find exactly 2 matches
- require.Equal(t, 2, len(matches), "Should find exactly 2 matches")
- })
- }
- }
- func TestSearchImplementations(t *testing.T) {
- t.Parallel()
- tempDir := t.TempDir()
- for path, content := range map[string]string{
- "file1.go": "package main\nfunc main() {\n\tfmt.Println(\"hello world\")\n}",
- "file2.js": "console.log('hello world');",
- "file3.txt": "hello world from text file",
- "binary.exe": "\x00\x01\x02\x03",
- "empty.txt": "",
- "subdir/nested.go": "package nested\n// hello world comment",
- ".hidden.txt": "hello world in hidden file",
- "file4.txt": "hello world from a banana",
- "file5.txt": "hello world from a grape",
- } {
- fullPath := filepath.Join(tempDir, path)
- require.NoError(t, os.MkdirAll(filepath.Dir(fullPath), 0o755))
- require.NoError(t, os.WriteFile(fullPath, []byte(content), 0o644))
- }
- require.NoError(t, os.WriteFile(filepath.Join(tempDir, ".gitignore"), []byte("file4.txt\n"), 0o644))
- require.NoError(t, os.WriteFile(filepath.Join(tempDir, ".crushignore"), []byte("file5.txt\n"), 0o644))
- for name, fn := range map[string]func(pattern, path, include string) ([]grepMatch, error){
- "regex": searchFilesWithRegex,
- "rg": func(pattern, path, include string) ([]grepMatch, error) {
- return searchWithRipgrep(t.Context(), pattern, path, include)
- },
- } {
- t.Run(name, func(t *testing.T) {
- t.Parallel()
- if name == "rg" && getRg() == "" {
- t.Skip("rg is not in $PATH")
- }
- matches, err := fn("hello world", tempDir, "")
- require.NoError(t, err)
- require.Equal(t, len(matches), 4)
- for _, match := range matches {
- require.NotEmpty(t, match.path)
- require.NotZero(t, match.lineNum)
- require.NotEmpty(t, match.lineText)
- require.NotZero(t, match.modTime)
- require.NotContains(t, match.path, ".hidden.txt")
- require.NotContains(t, match.path, "file4.txt")
- require.NotContains(t, match.path, "file5.txt")
- require.NotContains(t, match.path, "binary.exe")
- }
- })
- }
- }
- // Benchmark to show performance improvement
- func BenchmarkRegexCacheVsCompile(b *testing.B) {
- cache := newRegexCache()
- pattern := "test.*pattern.*[0-9]+"
- b.Run("WithCache", func(b *testing.B) {
- for b.Loop() {
- _, err := cache.get(pattern)
- if err != nil {
- b.Fatal(err)
- }
- }
- })
- b.Run("WithoutCache", func(b *testing.B) {
- for b.Loop() {
- _, err := regexp.Compile(pattern)
- if err != nil {
- b.Fatal(err)
- }
- }
- })
- }
- func TestIsTextFile(t *testing.T) {
- t.Parallel()
- tempDir := t.TempDir()
- tests := []struct {
- name string
- filename string
- content []byte
- wantText bool
- }{
- {
- name: "go file",
- filename: "test.go",
- content: []byte("package main\n\nfunc main() {}\n"),
- wantText: true,
- },
- {
- name: "yaml file",
- filename: "config.yaml",
- content: []byte("key: value\nlist:\n - item1\n - item2\n"),
- wantText: true,
- },
- {
- name: "yml file",
- filename: "config.yml",
- content: []byte("key: value\n"),
- wantText: true,
- },
- {
- name: "json file",
- filename: "data.json",
- content: []byte(`{"key": "value"}`),
- wantText: true,
- },
- {
- name: "javascript file",
- filename: "script.js",
- content: []byte("console.log('hello');\n"),
- wantText: true,
- },
- {
- name: "typescript file",
- filename: "script.ts",
- content: []byte("const x: string = 'hello';\n"),
- wantText: true,
- },
- {
- name: "markdown file",
- filename: "README.md",
- content: []byte("# Title\n\nSome content\n"),
- wantText: true,
- },
- {
- name: "shell script",
- filename: "script.sh",
- content: []byte("#!/bin/bash\necho 'hello'\n"),
- wantText: true,
- },
- {
- name: "python file",
- filename: "script.py",
- content: []byte("print('hello')\n"),
- wantText: true,
- },
- {
- name: "xml file",
- filename: "data.xml",
- content: []byte("<?xml version=\"1.0\"?>\n<root></root>\n"),
- wantText: true,
- },
- {
- name: "plain text",
- filename: "file.txt",
- content: []byte("plain text content\n"),
- wantText: true,
- },
- {
- name: "css file",
- filename: "style.css",
- content: []byte("body { color: red; }\n"),
- wantText: true,
- },
- {
- name: "scss file",
- filename: "style.scss",
- content: []byte("$primary: blue;\nbody { color: $primary; }\n"),
- wantText: true,
- },
- {
- name: "sass file",
- filename: "style.sass",
- content: []byte("$primary: blue\nbody\n color: $primary\n"),
- wantText: true,
- },
- {
- name: "rust file",
- filename: "main.rs",
- content: []byte("fn main() {\n println!(\"Hello, world!\");\n}\n"),
- wantText: true,
- },
- {
- name: "zig file",
- filename: "main.zig",
- content: []byte("const std = @import(\"std\");\npub fn main() void {}\n"),
- wantText: true,
- },
- {
- name: "java file",
- filename: "Main.java",
- content: []byte("public class Main {\n public static void main(String[] args) {}\n}\n"),
- wantText: true,
- },
- {
- name: "c file",
- filename: "main.c",
- content: []byte("#include <stdio.h>\nint main() { return 0; }\n"),
- wantText: true,
- },
- {
- name: "cpp file",
- filename: "main.cpp",
- content: []byte("#include <iostream>\nint main() { return 0; }\n"),
- wantText: true,
- },
- {
- name: "fish shell",
- filename: "script.fish",
- content: []byte("#!/usr/bin/env fish\necho 'hello'\n"),
- wantText: true,
- },
- {
- name: "powershell file",
- filename: "script.ps1",
- content: []byte("Write-Host 'Hello, World!'\n"),
- wantText: true,
- },
- {
- name: "cmd batch file",
- filename: "script.bat",
- content: []byte("@echo off\necho Hello, World!\n"),
- wantText: true,
- },
- {
- name: "cmd file",
- filename: "script.cmd",
- content: []byte("@echo off\necho Hello, World!\n"),
- wantText: true,
- },
- {
- name: "binary exe",
- filename: "binary.exe",
- content: []byte{0x4D, 0x5A, 0x90, 0x00, 0x03, 0x00, 0x00, 0x00},
- wantText: false,
- },
- {
- name: "png image",
- filename: "image.png",
- content: []byte{0x89, 0x50, 0x4E, 0x47, 0x0D, 0x0A, 0x1A, 0x0A},
- wantText: false,
- },
- {
- name: "jpeg image",
- filename: "image.jpg",
- content: []byte{0xFF, 0xD8, 0xFF, 0xE0, 0x00, 0x10, 0x4A, 0x46},
- wantText: false,
- },
- {
- name: "zip archive",
- filename: "archive.zip",
- content: []byte{0x50, 0x4B, 0x03, 0x04, 0x14, 0x00, 0x00, 0x00},
- wantText: false,
- },
- {
- name: "pdf file",
- filename: "document.pdf",
- content: []byte("%PDF-1.4\n%âãÏÓ\n"),
- wantText: false,
- },
- }
- for _, tt := range tests {
- t.Run(tt.name, func(t *testing.T) {
- t.Parallel()
- filePath := filepath.Join(tempDir, tt.filename)
- require.NoError(t, os.WriteFile(filePath, tt.content, 0o644))
- got := isTextFile(filePath)
- require.Equal(t, tt.wantText, got, "isTextFile(%s) = %v, want %v", tt.filename, got, tt.wantText)
- })
- }
- }
- func TestColumnMatch(t *testing.T) {
- t.Parallel()
- // Test both implementations
- for name, fn := range map[string]func(pattern, path, include string) ([]grepMatch, error){
- "regex": searchFilesWithRegex,
- "rg": func(pattern, path, include string) ([]grepMatch, error) {
- return searchWithRipgrep(t.Context(), pattern, path, include)
- },
- } {
- t.Run(name, func(t *testing.T) {
- t.Parallel()
- if name == "rg" && getRg() == "" {
- t.Skip("rg is not in $PATH")
- }
- matches, err := fn("THIS", "./testdata/", "")
- require.NoError(t, err)
- require.Len(t, matches, 1)
- match := matches[0]
- require.Equal(t, 2, match.lineNum)
- require.Equal(t, 14, match.charNum)
- require.Equal(t, "I wanna grep THIS particular word", match.lineText)
- require.Equal(t, "testdata/grep.txt", filepath.ToSlash(filepath.Clean(match.path)))
- })
- }
- }
|