Files
awesome-chatgpt-prompts-pro…/scripts/generate-contributors.sh

431 lines
16 KiB
Bash
Executable File

#!/bin/bash
# Script to generate contributor commits from prompts.csv
# Fetches latest prompts from prompts.chat/prompts.csv
# Compares with existing prompts.csv and creates commits only for new prompts
set -e
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_DIR="$(dirname "$SCRIPT_DIR")"
CSV_FILE="$PROJECT_DIR/prompts.csv"
REMOTE_CSV="$PROJECT_DIR/prompts.csv.remote"
REMOTE_CSV_URL="https://prompts.chat/prompts.csv"
# Fetch latest prompts.csv from prompts.chat
echo "Fetching latest prompts.csv from $REMOTE_CSV_URL..."
if ! curl -fsSL "$REMOTE_CSV_URL" -o "$REMOTE_CSV"; then
echo "Error: Failed to fetch prompts.csv from $REMOTE_CSV_URL"
echo "Make sure prompts.chat is running and the endpoint is available."
exit 1
fi
echo "Successfully fetched remote prompts.csv"
# Initialize local CSV if it doesn't exist
if [ ! -f "$CSV_FILE" ]; then
echo "Local prompts.csv not found, initializing with header..."
head -1 "$REMOTE_CSV" > "$CSV_FILE"
git add "$CSV_FILE"
git commit -m "Initialize prompts.csv with header" --allow-empty 2>/dev/null || true
fi
echo ""
echo "Comparing local and remote prompts.csv..."
# Process diffs and create commits for new prompts
export PROJECT_DIR
set +e # Temporarily allow non-zero exit
python3 << 'PYTHON_SCRIPT'
import csv
import subprocess
import os
import io
import sys
# Increase CSV field size limit to handle large prompt content
csv.field_size_limit(sys.maxsize)
project_dir = os.environ.get('PROJECT_DIR', '.')
csv_file = os.path.join(project_dir, 'prompts.csv')
remote_csv = os.path.join(project_dir, 'prompts.csv.remote')
# Read existing local prompts (by act title as key)
local_prompts = {}
fieldnames = None
skipped_local = 0
with open(csv_file, 'r', newline='', encoding='utf-8') as f:
# Normalize CRLF to LF
content = f.read().replace('\r\n', '\n').replace('\r', '\n')
reader = csv.DictReader(io.StringIO(content))
fieldnames = reader.fieldnames
for row in reader:
try:
act = row.get('act', '').strip()
if act:
local_prompts[act] = row
except csv.Error as e:
skipped_local += 1
print(f"Skipping local row due to CSV error: {e}")
print(f"Found {len(local_prompts)} existing local prompts" + (f" (skipped {skipped_local})" if skipped_local else ""))
# Read remote prompts (normalize CRLF to LF)
remote_prompts = []
skipped_remote = 0
with open(remote_csv, 'r', newline='', encoding='utf-8') as f:
content = f.read().replace('\r\n', '\n').replace('\r', '\n')
reader = csv.DictReader(io.StringIO(content))
remote_fieldnames = reader.fieldnames
while True:
try:
row = next(reader)
remote_prompts.append(row)
except csv.Error as e:
skipped_remote += 1
print(f"Skipping remote row due to CSV error: {e}")
except StopIteration:
break
print(f"Found {len(remote_prompts)} remote prompts" + (f" (skipped {skipped_remote})" if skipped_remote else ""))
# Use remote fieldnames if local is empty
if not fieldnames:
fieldnames = remote_fieldnames
# Build set of remote prompt acts for quick lookup
remote_acts = set()
for row in remote_prompts:
act = row.get('act', '').strip()
if act:
remote_acts.add(act)
# Find new, updated, and deleted prompts
new_prompts = []
updated_prompts = []
deleted_prompts = []
# Check for new and updated
for row in remote_prompts:
act = row.get('act', '').strip()
if not act:
continue
if act not in local_prompts:
new_prompts.append(row)
else:
local_row = local_prompts[act]
# Check if content OR contributors changed
content_changed = row.get('prompt', '').strip() != local_row.get('prompt', '').strip()
contributors_changed = row.get('contributor', '').strip() != local_row.get('contributor', '').strip()
if content_changed or contributors_changed:
updated_prompts.append((row, local_row))
# Check for deleted (in local but not in remote)
for act, local_row in local_prompts.items():
if act not in remote_acts:
deleted_prompts.append(local_row)
print(f"Found {len(new_prompts)} new prompts to add")
print(f"Found {len(updated_prompts)} updated prompts to modify")
print(f"Found {len(deleted_prompts)} prompts to remove (unlisted/deleted)")
# Helper function to parse contributors (supports "user1,user2,user3" format)
def parse_contributors(contributor_field):
"""Parse contributor field, returns (primary_author, co_authors_list)"""
if not contributor_field:
return 'anonymous', []
# Split by comma and clean up
contributors = [c.strip() for c in contributor_field.split(',') if c.strip()]
if not contributors:
return 'anonymous', []
primary = contributors[0]
co_authors = contributors[1:] if len(contributors) > 1 else []
return primary, co_authors
def build_commit_message(action, act, co_authors):
"""Build commit message with optional co-author trailers"""
msg = f'{action} prompt: {act}'
if co_authors:
msg += '\n\n'
for co_author in co_authors:
co_email = f"{co_author}@users.noreply.github.com"
msg += f'Co-authored-by: {co_author} <{co_email}>\n'
return msg
def format_contributor_links(contributor_field):
"""Format contributors as GitHub profile links"""
if not contributor_field:
return '@anonymous'
contributors = [c.strip() for c in contributor_field.split(',') if c.strip()]
if not contributors:
return '@anonymous'
return ', '.join([f'[@{c}](https://github.com/{c})' for c in contributors])
def generate_prompt_block(row):
"""Generate a single prompt's <details> block"""
act = row.get('act', 'Untitled')
prompt = row.get('prompt', '')
contributor = row.get('contributor', '')
prompt_type = row.get('type', 'TEXT').upper()
# Determine code block language based on type
if prompt_type == 'TEXT':
lang = 'md'
elif prompt_type == 'JSON':
lang = 'json'
elif prompt_type == 'YAML':
lang = 'yaml'
else:
lang = 'md'
contributor_links = format_contributor_links(contributor)
block = f'<details>\n'
block += f'<summary><strong>{act}</strong></summary>\n\n'
block += f'## {act}\n\n'
block += f'Contributed by {contributor_links}\n\n'
block += f'```{lang}\n'
block += f'{prompt}\n'
block += f'```\n\n'
block += f'</details>\n\n'
return block
def init_prompts_md(prompts_md_path):
"""Initialize PROMPTS.md with header if it doesn't exist"""
if not os.path.exists(prompts_md_path):
with open(prompts_md_path, 'w', encoding='utf-8') as f:
f.write('# prompts.chat\n\n')
f.write('> A curated list of prompts for ChatGPT and other AI models.\n\n')
f.write('---\n\n')
def append_prompt_to_md(row, prompts_md_path):
"""Append a new prompt block to PROMPTS.md"""
init_prompts_md(prompts_md_path)
block = generate_prompt_block(row)
with open(prompts_md_path, 'a', encoding='utf-8') as f:
f.write(block)
def update_prompt_in_md(row, prompts_md_path):
"""Update an existing prompt's block in PROMPTS.md"""
act = row.get('act', '')
if not os.path.exists(prompts_md_path):
append_prompt_to_md(row, prompts_md_path)
return
with open(prompts_md_path, 'r', encoding='utf-8') as f:
content = f.read()
# Find and replace the specific prompt block using regex
import re
# Pattern to match the entire <details> block for this prompt
pattern = rf'<details>\n<summary><strong>{re.escape(act)}</strong></summary>.*?</details>\n\n'
new_block = generate_prompt_block(row)
new_content, count = re.subn(pattern, new_block, content, flags=re.DOTALL)
if count > 0:
with open(prompts_md_path, 'w', encoding='utf-8') as f:
f.write(new_content)
else:
# Prompt not found, append it
append_prompt_to_md(row, prompts_md_path)
def remove_prompt_from_md(act, prompts_md_path):
"""Remove a prompt's block from PROMPTS.md"""
if not os.path.exists(prompts_md_path):
return
with open(prompts_md_path, 'r', encoding='utf-8') as f:
content = f.read()
import re
pattern = rf'<details>\n<summary><strong>{re.escape(act)}</strong></summary>.*?</details>\n\n'
new_content = re.sub(pattern, '', content, flags=re.DOTALL)
with open(prompts_md_path, 'w', encoding='utf-8') as f:
f.write(new_content)
prompts_md_path = os.path.join(project_dir, 'PROMPTS.md')
if not new_prompts and not updated_prompts and not deleted_prompts:
print("\nNo CSV changes detected. Already up to date!")
else:
# Process updates one at a time (apply and commit each update separately)
if updated_prompts:
print("\nApplying updates to existing prompts...")
for i, (remote_row, local_row) in enumerate(updated_prompts, 1):
act = remote_row.get('act', '').strip()
contributor_field = remote_row.get('contributor', '').strip()
# Update this specific prompt in local_prompts
local_prompts[act] = remote_row
# Rewrite the CSV with this update applied
with open(csv_file, 'w', newline='') as f:
writer = csv.DictWriter(f, fieldnames=fieldnames)
writer.writeheader()
# Write in order of remote (to maintain order)
for row in remote_prompts:
row_act = row.get('act', '').strip()
if row_act in local_prompts:
writer.writerow(local_prompts[row_act])
# Update only this prompt's block in PROMPTS.md
update_prompt_in_md(remote_row, prompts_md_path)
primary_author, co_authors = parse_contributors(contributor_field)
email = f"{primary_author}@users.noreply.github.com"
subprocess.run(['git', 'add', csv_file, prompts_md_path], check=True)
# Check if there are actual changes to commit
diff_result = subprocess.run(['git', 'diff', '--cached', '--quiet'], capture_output=True)
if diff_result.returncode == 0:
# No changes staged, skip this commit
print(f"[UPDATE {i}/{len(updated_prompts)}] {act} - no changes, skipping")
continue
env = os.environ.copy()
env['GIT_AUTHOR_NAME'] = primary_author
env['GIT_AUTHOR_EMAIL'] = email
env['GIT_COMMITTER_NAME'] = primary_author
env['GIT_COMMITTER_EMAIL'] = email
commit_msg = build_commit_message('Update', act, co_authors)
subprocess.run([
'git', 'commit',
'-m', commit_msg,
f'--author={primary_author} <{email}>'
], env=env, check=True)
co_authors_str = f" (+ {', '.join(co_authors)})" if co_authors else ""
print(f"[UPDATE {i}/{len(updated_prompts)}] {primary_author}{co_authors_str}: {act}")
# Process new prompts
if new_prompts:
print("\nCreating commits for new prompts...")
for i, row in enumerate(new_prompts, 1):
contributor_field = row.get('contributor', '').strip()
act = row.get('act', 'Unknown')
primary_author, co_authors = parse_contributors(contributor_field)
email = f"{primary_author}@users.noreply.github.com"
# Append this row to the CSV
with open(csv_file, 'a', newline='') as f:
writer = csv.DictWriter(f, fieldnames=fieldnames)
writer.writerow(row)
# Track in local_prompts
local_prompts[act] = row
# Append only this prompt's block to PROMPTS.md
append_prompt_to_md(row, prompts_md_path)
# Stage and commit
subprocess.run(['git', 'add', csv_file, prompts_md_path], check=True)
# Check if there are actual changes to commit
diff_result = subprocess.run(['git', 'diff', '--cached', '--quiet'], capture_output=True)
if diff_result.returncode == 0:
print(f"[NEW {i}/{len(new_prompts)}] {act} - no changes, skipping")
continue
env = os.environ.copy()
env['GIT_AUTHOR_NAME'] = primary_author
env['GIT_AUTHOR_EMAIL'] = email
env['GIT_COMMITTER_NAME'] = primary_author
env['GIT_COMMITTER_EMAIL'] = email
commit_msg = build_commit_message('Add', act, co_authors)
subprocess.run([
'git', 'commit',
'-m', commit_msg,
f'--author={primary_author} <{email}>'
], env=env, check=True)
co_authors_str = f" (+ {', '.join(co_authors)})" if co_authors else ""
print(f"[NEW {i}/{len(new_prompts)}] {primary_author}{co_authors_str}: {act}")
# Process deleted prompts (remove from CSV, commit with original author)
if deleted_prompts:
print("\nRemoving unlisted/deleted prompts...")
for i, row in enumerate(deleted_prompts, 1):
contributor_field = row.get('contributor', '').strip()
act = row.get('act', 'Unknown')
primary_author, co_authors = parse_contributors(contributor_field)
email = f"{primary_author}@users.noreply.github.com"
# Remove this prompt from local_prompts
if act in local_prompts:
del local_prompts[act]
# Rewrite CSV without the deleted prompt
with open(csv_file, 'w', newline='') as f:
writer = csv.DictWriter(f, fieldnames=fieldnames)
writer.writeheader()
for remaining_act, remaining_row in local_prompts.items():
writer.writerow(remaining_row)
# Remove only this prompt's block from PROMPTS.md
remove_prompt_from_md(act, prompts_md_path)
# Stage and commit
subprocess.run(['git', 'add', csv_file, prompts_md_path], check=True)
# Check if there are actual changes to commit
diff_result = subprocess.run(['git', 'diff', '--cached', '--quiet'], capture_output=True)
if diff_result.returncode == 0:
print(f"[REMOVE {i}/{len(deleted_prompts)}] {act} - no changes, skipping")
continue
env = os.environ.copy()
env['GIT_AUTHOR_NAME'] = primary_author
env['GIT_AUTHOR_EMAIL'] = email
env['GIT_COMMITTER_NAME'] = primary_author
env['GIT_COMMITTER_EMAIL'] = email
commit_msg = build_commit_message('Remove', act, co_authors)
subprocess.run([
'git', 'commit',
'-m', commit_msg,
f'--author={primary_author} <{email}>'
], env=env, check=True)
co_authors_str = f" (+ {', '.join(co_authors)})" if co_authors else ""
print(f"[REMOVE {i}/{len(deleted_prompts)}] {primary_author}{co_authors_str}: {act}")
print(f"\nDone! Created {len(new_prompts)} new, {len(updated_prompts)} update, {len(deleted_prompts)} remove commits.")
PYTHON_SCRIPT
PYTHON_EXIT=$?
set -e # Re-enable exit on error
# Clean up
rm -f "$REMOTE_CSV"
# Check for actual Python errors
if [ $PYTHON_EXIT -ne 0 ]; then
echo "Error: Script failed with exit code $PYTHON_EXIT"
exit 1
fi
echo ""
echo "Review with: git log --oneline prompts.csv PROMPTS.md"
echo ""
echo "To push: git push origin main"