82 lines
3.2 KiB
Bash
Executable File
82 lines
3.2 KiB
Bash
Executable File
#!/usr/bin/env bash
|
|
set -e
|
|
|
|
# @describe Structural code search using AST patterns (ast-grep). Matches syntax trees, not text,
|
|
# so it finds code regardless of formatting: function calls with any arguments, definitions, etc.
|
|
# Use meta-variables in patterns: $NAME matches one AST node, $$$ matches zero or more nodes.
|
|
# Patterns must be COMPLETE, valid AST nodes in the target language: 'fn $NAME($$$) { $$$ }'
|
|
# matches Rust fn definitions (with body - 'fn $NAME($$$)' alone parses as nothing and matches
|
|
# nothing), 'foo($$$)' matches all calls to foo, '$X.unwrap()' matches all unwrap calls.
|
|
# Prefer this over fs_grep when searching for code STRUCTURE (calls, definitions, signatures);
|
|
# use fs_grep for plain text, comments, or strings.
|
|
|
|
# @option --pattern! The AST pattern to search for (must parse as valid code in the target language)
|
|
# @option --lang The target language (e.g. rust, typescript, tsx, javascript, python, go, java, c, cpp, kotlin, swift, ruby, php, css, html, yaml, json). Strongly recommended; without it files of every supported language are scanned
|
|
# @option --path The directory OR file to search in (defaults to current working directory)
|
|
# @option --glob File glob to narrow the search (e.g. "src/**/*.rs", "!**/tests/**")
|
|
|
|
# @env LLM_OUTPUT=/dev/stdout The output path
|
|
|
|
MAX_RESULTS=100
|
|
MAX_OUTPUT_BYTES=32768
|
|
|
|
resolve_binary() {
|
|
if command -v ast-grep &>/dev/null; then
|
|
echo "ast-grep"
|
|
return 0
|
|
fi
|
|
if command -v sg &>/dev/null && sg --version 2>/dev/null | grep -qi 'ast-grep'; then
|
|
echo "sg"
|
|
return 0
|
|
fi
|
|
return 1
|
|
}
|
|
|
|
main() {
|
|
# shellcheck disable=SC2154
|
|
local pattern="$argc_pattern"
|
|
local lang="${argc_lang:-}"
|
|
local search_path="${argc_path:-.}"
|
|
local glob="${argc_glob:-}"
|
|
|
|
local bin
|
|
if ! bin=$(resolve_binary); then
|
|
printf 'ast-grep is not installed. Fall back to fs_grep for this search.\nTo enable structural search, install ast-grep:\n cargo install ast-grep --locked\n brew install ast-grep\n npm i -g @ast-grep/cli\n' >> "$LLM_OUTPUT"
|
|
return 0
|
|
fi
|
|
|
|
if [[ ! -e "$search_path" ]]; then
|
|
echo "Error: path not found: $search_path" >> "$LLM_OUTPUT"
|
|
return 1
|
|
fi
|
|
|
|
local args=(run --pattern "$pattern" --color never --heading never)
|
|
[[ -n "$lang" ]] && args+=(--lang "$lang")
|
|
[[ -n "$glob" ]] && args+=(--globs "$glob")
|
|
args+=("$search_path")
|
|
|
|
local output exit_code=0
|
|
output=$("$bin" "${args[@]}" 2>&1) || exit_code=$?
|
|
|
|
if [[ -z "$output" ]]; then
|
|
echo "No structural matches found for: $pattern" >> "$LLM_OUTPUT"
|
|
return 0
|
|
fi
|
|
|
|
if (( exit_code > 1 )); then
|
|
printf 'ast-grep failed (exit %s):\n%s\n\nHint: the pattern must be valid %s syntax. Meta-variables: $NAME (one node), $$$ (zero or more).\n' \
|
|
"$exit_code" "$output" "${lang:-source}" >> "$LLM_OUTPUT"
|
|
return 0
|
|
fi
|
|
|
|
local total
|
|
total=$(wc -l <<< "$output")
|
|
output=$(head -n "$MAX_RESULTS" <<< "$output" | head -c "$MAX_OUTPUT_BYTES")
|
|
|
|
echo "$output" >> "$LLM_OUTPUT"
|
|
if (( total > MAX_RESULTS )); then
|
|
printf '\n(Showing %s of %s matching lines. Narrow with --glob, --lang, or a more specific pattern.)\n' \
|
|
"$MAX_RESULTS" "$total" >> "$LLM_OUTPUT"
|
|
fi
|
|
}
|