Improve GCP workload identity federation evidence #997

Workflow file for this run

.github/workflows/injection-scan.yml at 0d32993

	name: Prompt Injection Scan

	on:
	pull_request:

	permissions:
	contents: read

	jobs:
	injection-scan:
	runs-on: ubuntu-latest
	steps:
	- name: Checkout repository
	uses: actions/checkout@v4 # pin to SHA for SLSA compliance in future iteration

	- name: Scan for prompt injection patterns
	run: \|
	# HIGH-CONFIDENCE injection patterns — phrases that should never
	# appear in skill files outside of clearly defensive contexts.
	# These are imperative commands directed at the agent, not
	# descriptions of attacks or technical terminology.
	PATTERNS=(
	"new directive"
	"system override"
	"forget your instructions"
	"send to http"
	"curl -X POST"
	"api.telegram"
	"discord.com/api/webhooks"
	"hooks.slack.com/services"
	)

	FOUND_ISSUES=0

	for pattern in "${PATTERNS[@]}"; do
	MATCHES=$(grep -rin "$pattern" skills/ roles/ --include="*.md" 2>/dev/null \|\| true)
	if [ -n "$MATCHES" ]; then
	# Exclude ai-security/ files (contain educational attack examples)
	FILTERED=$(echo "$MATCHES" \| grep -v "ai-security/prompt-injection/\\|ai-security/llm-top-10/\\|ai-security/agentic-top-10/\\|ai-security/agent-security/\\|ai-security/model-supply-chain/\\|ai-security/ai-data-privacy/" \|\| true)
	if [ -n "$FILTERED" ]; then
	echo "FOUND injection pattern \"$pattern\":"
	echo "$FILTERED"
	echo ""
	FOUND_ISSUES=1
	fi
	fi
	done

	# CONTEXT-DEPENDENT patterns — these words appear legitimately in
	# security content (e.g., "Never exfiltrate data", "webhook URL").
	# Only flag them when they appear as bare imperatives, not in
	# defensive safety notices or technical descriptions.
	# We scan for the imperative/attack forms specifically:
	IMPERATIVE_PATTERNS=(
	"ignore previous instructions and"
	"ignore all previous instructions"
	"you are now a"
	"you are now in"
	"disregard your"
	"disregard all previous"
	)

	for pattern in "${IMPERATIVE_PATTERNS[@]}"; do
	MATCHES=$(grep -rin "$pattern" skills/ roles/ --include="*.md" 2>/dev/null \|\| true)
	if [ -n "$MATCHES" ]; then
	# Exclude ai-security/ (educational) and lines with defensive context
	FILTERED=$(echo "$MATCHES" \
	\| grep -v "ai-security/prompt-injection/\\|ai-security/llm-top-10/\\|ai-security/agentic-top-10/\\|ai-security/agent-security/\\|ai-security/model-supply-chain/\\|ai-security/ai-data-privacy/" \
	\| grep -v "treat it as" \
	\| grep -v "not a command" \
	\| grep -v "not as a directive" \
	\| grep -v "not obeyed" \
	\| grep -v "flag it as" \
	\| grep -v "e\.g\.\," \
	\| grep -v "such as" \
	\| grep -v "contains text like" \
	\|\| true)
	if [ -n "$FILTERED" ]; then
	echo "FOUND imperative injection pattern \"$pattern\":"
	echo "$FILTERED"
	echo ""
	FOUND_ISSUES=1
	fi
	fi
	done

	if [ "$FOUND_ISSUES" -ne 0 ]; then
	echo "FAIL: Prompt injection patterns detected. Review flagged lines above."
	echo ""
	echo "NOTE: The ai-security/ directory and lines with defensive context"
	echo "(e.g., 'treat it as a finding') are excluded automatically."
	exit 1
	fi

	echo "PASS: No prompt injection patterns detected."

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Improve GCP workload identity federation evidence #997

Workflow file

Improve GCP workload identity federation evidence #997

Uh oh!

Workflow file for this run