voarsh2 · voarsh2 · Feb 9, 2026 · Feb 9, 2026 · Feb 9, 2026 · Feb 9, 2026
diff --git a/.github/workflows/claude.yaml b/.github/workflows/claude.yaml
@@ -0,0 +1,86 @@
+name: Claude Code
+
+# Each trigger delivers a payload whose body text the job guard scans for "@claude".
+on:
+  issue_comment:
+    types: [created]
+  pull_request_review_comment:
+    types: [created]
+  issues:
+    types: [opened]
+  pull_request_review:
+    types: [submitted]
+  pull_request_target:
+    types: [opened, synchronize]
+
+jobs:
+  claude:
+    # Run only when a human OWNER/MEMBER/COLLABORATOR authored the text mentioning @claude.
+    # Each branch is keyed on the event name and reads the body and author_association
+    # from the same payload object. Accepting any object's association would let an
+    # arbitrary commenter trigger this write-privileged job on an issue or PR that a
+    # maintainer opened.
+    if: >
+      github.event.sender.type == 'User' && (
+        (
+          (github.event_name == 'issue_comment' ||
+          github.event_name == 'pull_request_review_comment') &&
+          contains(github.event.comment.body, '@claude') &&
+          contains(fromJSON('["OWNER", "MEMBER", "COLLABORATOR"]'), github.event.comment.author_association)
+        ) || (
+          github.event_name == 'pull_request_review' &&
+          contains(github.event.review.body, '@claude') &&
+          contains(fromJSON('["OWNER", "MEMBER", "COLLABORATOR"]'), github.event.review.author_association)
+        ) || (
+          github.event_name == 'issues' &&
+          contains(github.event.issue.body, '@claude') &&
+          contains(fromJSON('["OWNER", "MEMBER", "COLLABORATOR"]'), github.event.issue.author_association)
+        ) || (
+          github.event_name == 'pull_request_target' &&
+          contains(github.event.pull_request.body, '@claude') &&
+          contains(fromJSON('["OWNER", "MEMBER", "COLLABORATOR"]'), github.event.pull_request.author_association)
+        )
+      )
+    runs-on: ubuntu-latest
+    permissions:
+      # CRITICAL: Write permissions are required for the action to push branches and update issues/PRs.
+      contents: write
+      pull-requests: write
+      issues: write
+      id-token: write # Required for OIDC token exchange
+      actions: read  # Required for Claude to read CI results on PRs
+
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          # Resolves to the PR head commit whenever the payload carries a pull_request object;
+          # it is empty for issues / issue_comment, where checkout uses its default ref.
+          # NOTE(review): PR-head code runs next to write permissions and secrets; this relies
+          # on the job guard above admitting only trusted authors - confirm before loosening it.
+          ref: ${{ github.event.pull_request.head.sha }}
+
+      - name: Create Claude settings file
+        # The secret is handed over as an env var and serialised by jq, so it is never pasted
+        # into the script text and is JSON-escaped whatever characters it contains.
+        env:
+          CUSTOM_ENDPOINT_API_KEY: ${{ secrets.CUSTOM_ENDPOINT_API_KEY }}
+        run: |
+          mkdir -p /home/runner/.claude
+          jq -n --arg token "$CUSTOM_ENDPOINT_API_KEY" \
+            '{env: {ANTHROPIC_BASE_URL: "https://api.z.ai/api/anthropic", ANTHROPIC_AUTH_TOKEN: $token}}' \
+            > /home/runner/.claude/settings.json
+
+      - name: Run Claude Code
+        id: claude
+        uses: anthropics/claude-code-action@v1
+        with:
+          # Still need this to satisfy the action's validation
+          anthropic_api_key: ${{ secrets.CUSTOM_ENDPOINT_API_KEY }}
+
+          # Use the same variable names as your local setup
+          settings: '{"env": {"ANTHROPIC_BASE_URL": "https://api.z.ai/api/anthropic", "ANTHROPIC_AUTH_TOKEN": "${{ secrets.CUSTOM_ENDPOINT_API_KEY }}"}}'
+
+          track_progress: true
+          claude_args: |
+            --allowedTools "Bash,Edit,Read,Write,Glob,Grep"
diff --git a/.github/workflows/cosqa-benchmark.yml b/.github/workflows/cosqa-benchmark.yml
@@ -0,0 +1,157 @@
+name: CoSQA Search Benchmark
+
+# Runs on manual dispatch, on PRs into `test` that touch the listed paths, and on a daily cron.
+on:
+  workflow_dispatch:
+    inputs:
+      enforce_hybrid_gate:
+        description: Fail run if best hybrid underperforms best dense past threshold
+        required: false
+        default: false
+        type: boolean
+      hybrid_min_delta:
+        description: Minimum accepted (hybrid_mrr - dense_mrr), e.g. -0.02
+        required: false
+        default: "-0.02"
+        type: string
+      upload_full_artifacts:
+        description: Upload full logs/json bundle (higher storage usage)
+        required: false
+        default: false
+        type: boolean
+
+  pull_request:
+    branches: [ test ]
+    paths:
+      - scripts/hybrid/**
+      - scripts/hybrid_search.py
+      - scripts/mcp_impl/search.py
+      - scripts/mcp_impl/context_search.py
+      - scripts/mcp_indexer_server.py
+      - scripts/benchmarks/cosqa/**
+      - .github/workflows/cosqa-benchmark.yml
+
+  schedule:
+    - cron: "25 3 * * *"
+
+jobs:
+  cosqa-bench:
+    runs-on: ubuntu-latest
+    timeout-minutes: 360
+
+    services:
+      qdrant:
+        image: qdrant/qdrant:v1.15.1
+        ports:
+          - 6333:6333
+
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+
+      - name: Cache pip
+        uses: actions/cache@v4
+        with:
+          path: ~/.cache/pip
+          key: ${{ runner.os }}-pip-${{ hashFiles('**/requirements*.txt', '**/pyproject.toml') }}
+          restore-keys: |
+            ${{ runner.os }}-pip-
+
+      - name: Cache HuggingFace datasets
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cache/huggingface/datasets
+            ~/.cache/huggingface/hub
+          key: ${{ runner.os }}-hf-cosqa-${{ hashFiles('scripts/benchmarks/cosqa/dataset.py') }}
+          restore-keys: |
+            ${{ runner.os }}-hf-cosqa-
+            ${{ runner.os }}-hf-
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install -r requirements.txt
+          pip install "datasets>=2.18.0"
+
+      - name: Wait for Qdrant
+        run: |
+          timeout 90 bash -c 'until curl -fsS http://localhost:6333/readyz; do sleep 2; done'
+          curl -fsS http://localhost:6333/collections >/dev/null
+
+      - name: Resolve run config
+        id: cfg
+        # Dispatch inputs reach the script as env vars instead of inline expression expansion,
+        # so a crafted value is handled as data and cannot rewrite the shell script itself.
+        env:
+          EVENT_NAME: ${{ github.event_name }}
+          DISPATCH_ENFORCE_HYBRID_GATE: ${{ inputs.enforce_hybrid_gate }}
+          DISPATCH_HYBRID_MIN_DELTA: ${{ inputs.hybrid_min_delta }}
+        run: |
+          echo "profile=full" >> "$GITHUB_OUTPUT"
+          echo "run_set=full" >> "$GITHUB_OUTPUT"
+          if [ "$EVENT_NAME" = "workflow_dispatch" ] && [ "$DISPATCH_ENFORCE_HYBRID_GATE" = "true" ]; then
+            echo "enforce_hybrid_gate=1" >> "$GITHUB_OUTPUT"
+          else
+            echo "enforce_hybrid_gate=0" >> "$GITHUB_OUTPUT"
+          fi
+          if [ "$EVENT_NAME" = "workflow_dispatch" ] && [ -n "$DISPATCH_HYBRID_MIN_DELTA" ]; then
+            echo "hybrid_min_delta=$DISPATCH_HYBRID_MIN_DELTA" >> "$GITHUB_OUTPUT"
+          else
+            echo "hybrid_min_delta=-0.02" >> "$GITHUB_OUTPUT"
+          fi
+
+      - name: Run CoSQA search matrix
+        id: bench
+        env:
+          QDRANT_URL: http://localhost:6333
+          PROFILE: ${{ steps.cfg.outputs.profile }}
+          RUN_SET: ${{ steps.cfg.outputs.run_set }}
+          ENFORCE_HYBRID_GATE: ${{ steps.cfg.outputs.enforce_hybrid_gate }}
+          HYBRID_MIN_DELTA: ${{ steps.cfg.outputs.hybrid_min_delta }}
+          PYTHONUNBUFFERED: "1"
+        run: |
+          RUN_TAG="gha-${{ github.run_id }}-${{ github.run_attempt }}"
+          OUT_DIR="bench_results/cosqa/${RUN_TAG}"
+          echo "out_dir=${OUT_DIR}" >> "$GITHUB_OUTPUT"
+          RUN_TAG="${RUN_TAG}" OUT_DIR="${OUT_DIR}" ./scripts/benchmarks/cosqa/run_search_matrix.sh
+
+      - name: Publish benchmark summary
+        if: always()
+        run: |
+          SUMMARY="${{ steps.bench.outputs.out_dir }}/summary.md"
+          if [ -f "${SUMMARY}" ]; then
+            cat "${SUMMARY}" >> "$GITHUB_STEP_SUMMARY"
+          else
+            echo "No summary file generated" >> "$GITHUB_STEP_SUMMARY"
+          fi
+
+      - name: Upload benchmark artifacts
+        # Skipped when the bench step never published out_dir (an earlier step failed);
+        # the paths below would otherwise resolve against the filesystem root.
+        if: always() && steps.bench.outputs.out_dir != '' && github.event_name == 'pull_request'
+        uses: actions/upload-artifact@v4
+        with:
+          name: cosqa-search-summary-${{ github.run_id }}-${{ github.run_attempt }}
+          path: |
+            ${{ steps.bench.outputs.out_dir }}/summary.md
+            ${{ steps.bench.outputs.out_dir }}/summary.json
+          retention-days: 3
+
+      - name: Upload full benchmark artifacts
+        # Same out_dir guard: an empty `path` would add a second failure on top of the real one.
+        if: |
+          always() && steps.bench.outputs.out_dir != '' && (
+            github.event_name == 'schedule' ||
+            (github.event_name == 'workflow_dispatch' && inputs.upload_full_artifacts == true)
+          )
+        uses: actions/upload-artifact@v4
+        with:
+          name: cosqa-search-bench-${{ github.run_id }}-${{ github.run_attempt }}
+          path: ${{ steps.bench.outputs.out_dir }}
+          retention-days: 7