#!/usr/bin/env bash
# gstack-learnings-search — read and filter project learnings
# Usage: gstack-learnings-search [--type TYPE] [--query KEYWORD] [--limit N] [--cross-project]
#
# Reads ~/.gstack/projects/$SLUG/learnings.jsonl, applies confidence decay,
# resolves duplicates (latest winner per key+type), and outputs formatted text.
# Exit 0 silently if no learnings file exists.
set -euo pipefail
SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
eval "$("$SCRIPT_DIR/gstack-slug" 2>/dev/null)"
GSTACK_HOME="${GSTACK_HOME:-$HOME/.gstack}"

TYPE=""
QUERY=""
LIMIT=10
CROSS_PROJECT=false

while [[ $# -gt 0 ]]; do
  case "$1" in
    --type) TYPE="$2"; shift 2 ;;
    --query) QUERY="$2"; shift 2 ;;
    --limit) LIMIT="$2"; shift 2 ;;
    --cross-project) CROSS_PROJECT=true; shift ;;
    *) shift ;;
  esac
done

LEARNINGS_FILE="$GSTACK_HOME/projects/$SLUG/learnings.jsonl"

# Collect cross-project JSONL files separately so the trust gate can distinguish
# current-project rows from rows loaded from other projects.
CROSS_FILES=()

if [ "$CROSS_PROJECT" = true ]; then
  # Add other projects' learnings (max 5)
  while IFS= read -r f; do
    CROSS_FILES+=("$f")
    [ ${#CROSS_FILES[@]} -ge 5 ] && break
  done < <(find "$GSTACK_HOME/projects" -name "learnings.jsonl" -not -path "*/$SLUG/*" 2>/dev/null)
fi

if [ ! -f "$LEARNINGS_FILE" ] && [ ${#CROSS_FILES[@]} -eq 0 ]; then
  exit 0
fi

emit_tagged_file() {
  local tag="$1"
  local file="$2"
  local line
  while IFS= read -r line || [ -n "$line" ]; do
    [ -n "$line" ] && printf '%s\t%s\n' "$tag" "$line"
  done < "$file"
}

# Process all files through bun for JSON parsing, decay, dedup, filtering
{
  [ -f "$LEARNINGS_FILE" ] && emit_tagged_file current "$LEARNINGS_FILE"
  if [ ${#CROSS_FILES[@]} -gt 0 ]; then
    for f in "${CROSS_FILES[@]}"; do
      emit_tagged_file cross "$f"
    done
  fi
} | GSTACK_SEARCH_TYPE="$TYPE" GSTACK_SEARCH_QUERY="$QUERY" GSTACK_SEARCH_LIMIT="$LIMIT" GSTACK_SEARCH_CROSS="$CROSS_PROJECT" bun -e "
const lines = (await Bun.stdin.text()).trim().split('\n').filter(Boolean);
const now = Date.now();
const type = process.env.GSTACK_SEARCH_TYPE || '';
const queryRaw = (process.env.GSTACK_SEARCH_QUERY || '').toLowerCase();
const queryTokens = queryRaw.split(/\s+/).filter(Boolean);
const limit = parseInt(process.env.GSTACK_SEARCH_LIMIT || '10', 10);

const entries = [];
for (const taggedLine of lines) {
  try {
    const tabIndex = taggedLine.indexOf('\t');
    const sourceTag = tabIndex === -1 ? 'current' : taggedLine.slice(0, tabIndex);
    const line = tabIndex === -1 ? taggedLine : taggedLine.slice(tabIndex + 1);
    const e = JSON.parse(line);
    if (!e.key || !e.type) continue;

    // Apply confidence decay: observed/inferred lose 1pt per 30 days
    let conf = e.confidence || 5;
    if (e.source === 'observed' || e.source === 'inferred') {
      const days = Math.floor((now - new Date(e.ts).getTime()) / 86400000);
      conf = Math.max(0, conf - Math.floor(days / 30));
    }
    e._effectiveConfidence = conf;

    // Determine if this is from the current project or cross-project
    // Cross-project entries are tagged for display
    const isCrossProject = sourceTag === 'cross';
    e._crossProject = isCrossProject;

    // Trust gate: cross-project learnings only loaded if trusted (user-stated)
    // This prevents prompt injection from one project's AI-generated learnings
    // silently influencing reviews in another project.
    if (isCrossProject && e.trusted === false) continue;

    entries.push(e);
  } catch {}
}

// Dedup: latest winner per key+type
const seen = new Map();
for (const e of entries) {
  const dk = e.key + '|' + e.type;
  const existing = seen.get(dk);
  if (!existing || new Date(e.ts) > new Date(existing.ts)) {
    seen.set(dk, e);
  }
}
let results = Array.from(seen.values());

// Filter by type
if (type) results = results.filter(e => e.type === type);

// Filter by query (token-OR: match if ANY whitespace-split token appears in ANY haystack)
if (queryTokens.length > 0) results = results.filter(e => {
  const haystacks = [(e.key || '').toLowerCase(), (e.insight || '').toLowerCase(), ...(e.files || []).map(f => f.toLowerCase())];
  return queryTokens.some(tok => haystacks.some(h => h.includes(tok)));
});

// Sort by effective confidence desc, then recency
results.sort((a, b) => {
  if (b._effectiveConfidence !== a._effectiveConfidence) return b._effectiveConfidence - a._effectiveConfidence;
  return new Date(b.ts).getTime() - new Date(a.ts).getTime();
});

// Limit
results = results.slice(0, limit);

if (results.length === 0) process.exit(0);

// Format output
const byType = {};
for (const e of results) {
  const t = e.type || 'unknown';
  if (!byType[t]) byType[t] = [];
  byType[t].push(e);
}

// Summary line
const counts = Object.entries(byType).map(([t, arr]) => arr.length + ' ' + t + (arr.length > 1 ? 's' : ''));
console.log('LEARNINGS: ' + results.length + ' loaded (' + counts.join(', ') + ')');
console.log('');

for (const [t, arr] of Object.entries(byType)) {
  console.log('## ' + t.charAt(0).toUpperCase() + t.slice(1) + 's');
  for (const e of arr) {
    const cross = e._crossProject ? ' [cross-project]' : '';
    const files = e.files?.length ? ' (files: ' + e.files.join(', ') + ')' : '';
    console.log('- [' + e.key + '] (confidence: ' + e._effectiveConfidence + '/10, ' + e.source + ', ' + (e.ts || '').split('T')[0] + ')' + cross);
    console.log('  ' + e.insight + files);
  }
  console.log('');
}
" 2>/dev/null || exit 0
