generated from nhcarrigan/template
ec58c9c843
CI / dependency-pin-check-typescript (push) Successful in 5s
CI / dependency-pin-check-python (push) Successful in 4s
CI / python (push) Successful in 9m28s
CI / typescript (push) Successful in 9m42s
Security Scan and Upload / Security & DefectDojo Upload (push) Successful in 1m39s
## Summary This PR completes the bash script restructuring and adds comprehensive documentation across all script categories. ### Bash Restructuring - Moved cohort shell scripts (`remove_github_members.sh`, `update_github_teams.sh`) from `python/cohort/` into a new `bash/cohort/` directory - Moved existing bash utilities (`add-keys-to-git.sh`, `fix-yubikey-perms.sh`, `list-yubikey-ssh-keys.sh`) into a new `bash/yubikey/` subdirectory - Updated `run.sh` to support **Bash** as a third language option alongside TypeScript and Python - Bash scripts are run directly (no 1Password secret injection needed) - Category discovery and script listing works the same as for TS/Python - Removed dead "Root Scripts" logic that was no longer needed ### Documentation Added `README.md` files for all script categories that were missing them: - `bash/cohort/README.md` — cohort GitHub team management scripts - `bash/yubikey/README.md` — YubiKey SSH key and permission utilities - `typescript/src/crowdin/README.md` — Crowdin translation management scripts - `typescript/src/discord/README.md` — Discord bot utility scripts - `typescript/src/discourse/README.md` — Discourse forum management scripts - `typescript/src/gitea/README.md` — Gitea bulk repository operation scripts - `typescript/src/github/README.md` — GitHub API interaction scripts - `typescript/src/music/README.md` — Music file metadata tools - `typescript/src/s3/README.md` — S3-compatible object storage scripts - `typescript/src/security/README.md` — Security analysis and reporting scripts - `python/cohort/README.md` — Updated to remove moved shell scripts, fix usage commands Also updated project-level docs: - **`README.md`** — Corrected project structure, fixed running instructions (removed references to non-existent `make run-ts`/`make run-py` targets), added Bash prerequisites - **`CLAUDE.md`** — Updated project overview, structure, development standards, and script-adding guides to reflect the current state of the project ✨ 
This PR was created with help from Hikari~ 🌸 Co-authored-by: Naomi Carrigan <commits@nhcarrigan.com> Reviewed-on: #6 Co-authored-by: Hikari <hikari@nhcarrigan.com> Co-committed-by: Hikari <hikari@nhcarrigan.com>
129 lines
4.3 KiB
Python
129 lines
4.3 KiB
Python
"""Verify Discord user IDs from a markdown table of applicant data.
|
|
|
|
Reads a markdown table containing Discord IDs and checks each one against the
Discord API to confirm the user is a member of the configured guild. Rate-limit
responses are waited out and retried automatically.
|
|
|
|
Data files (place in data/):
|
|
- table.md Markdown table of applicants including a Discord ID column
|
|
|
|
Outputs (written to data/):
|
|
- discord_verification.json Lists of verified, missing, and errored Discord IDs
|
|
|
|
Env vars:
|
|
- DISCORD_BOT_TOKEN Bot token for the Discord API
|
|
"""
|
|
|
|
import json
import os
import sys
import time
import urllib.error
import urllib.request
from pathlib import Path
from typing import Callable

DATA_DIR = Path(__file__).parent.parent.parent / "data"

# Configuration
# Read with .get() so that importing this module never fails; main() reports a
# missing token before any request is made.
BOT_TOKEN = os.environ.get("DISCORD_BOT_TOKEN")
GUILD_ID = "692816967895220344"
BASE_URL = "https://discord.com/api/v10"

# Position of the Discord ID within each table row (first column).
DISCORD_COLUMN = 0
# Seconds to wait on the API before a request is recorded as failed.
REQUEST_TIMEOUT = 30
# How many times one ID is re-requested after HTTP 429 responses.
MAX_RATE_LIMIT_RETRIES = 3
# Pause between consecutive IDs to avoid hitting the rate limit.
REQUEST_SPACING = 0.1


def parse_discord_ids(content: str) -> list[str]:
    """Extract the Discord IDs listed in the applicant table.

    The table is located by its header row, which must start with
    ``| Discord``. The line directly after the header is treated as the
    markdown separator row and skipped.

    Args:
        content: Full text of the markdown file.

    Returns:
        The numeric IDs found in the first column, in table order. Rows that
        do not start with ``|`` or whose first cell is not numeric are ignored.

    Raises:
        ValueError: If no header row is found.
    """
    lines = content.strip().split("\n")
    header_idx = next(
        (i for i, line in enumerate(lines) if line.startswith("| Discord")),
        None,
    )
    if header_idx is None:
        raise ValueError("Could not find table header!")

    discord_ids = []
    for line in lines[header_idx + 2:]:  # Skip header and separator
        if not line.startswith("|"):
            continue
        cols = [col.strip() for col in line.split("|")[1:-1]]
        if len(cols) <= DISCORD_COLUMN:
            continue
        candidate = cols[DISCORD_COLUMN]
        # isascii() rejects Unicode digits (e.g. superscripts) that isdigit()
        # accepts but that cannot be placed in the request URL.
        if candidate.isascii() and candidate.isdigit():
            discord_ids.append(candidate)
    return discord_ids


def _retry_delay(error: urllib.error.HTTPError) -> float:
    """Return how many seconds a 429 response asks the client to wait.

    Prefers ``retry_after`` from the JSON body, then the ``Retry-After``
    header, and falls back to one second when neither is usable.
    """
    try:
        payload = json.loads(error.read().decode())
        return max(0.0, float(payload["retry_after"]))
    except (AttributeError, KeyError, OSError, TypeError, ValueError):
        pass  # Body missing or not the expected JSON; try the header instead.

    headers = getattr(error, "headers", None)
    raw = headers.get("Retry-After") if headers is not None else None
    try:
        return max(0.0, float(raw))
    except (TypeError, ValueError):
        return 1.0


def fetch_member(
    discord_id: str, opener: Callable = urllib.request.urlopen
) -> tuple:
    """Ask the Discord API once whether ``discord_id`` is a guild member.

    Args:
        discord_id: Numeric Discord user ID.
        opener: Callable with the ``urllib.request.urlopen`` signature;
            replaceable so the function can be exercised without a network.

    Returns:
        A ``(status, detail)`` pair:

        - ``("verified", username)`` when the member exists.
        - ``("missing", None)`` on HTTP 404.
        - ``("rate_limited", seconds)`` on HTTP 429.
        - ``("error", code)`` with the int status for any other HTTP error.
        - ``("error", message)`` with a str for network or decoding failures.
    """
    url = f"{BASE_URL}/guilds/{GUILD_ID}/members/{discord_id}"
    request = urllib.request.Request(
        url, headers={"Authorization": f"Bot {BOT_TOKEN}"}
    )
    try:
        # The context manager closes the connection; the timeout keeps one
        # stalled request from hanging the whole run.
        with opener(request, timeout=REQUEST_TIMEOUT) as response:
            data = json.loads(response.read().decode())
    except urllib.error.HTTPError as exc:
        if exc.code == 404:
            return "missing", None
        if exc.code == 429:
            return "rate_limited", _retry_delay(exc)
        return "error", exc.code
    except OSError as exc:
        # URLError and socket timeouts: record the failure instead of
        # aborting, so results gathered so far are still saved.
        return "error", f"request failed ({getattr(exc, 'reason', exc)})"
    except ValueError as exc:
        return "error", f"unreadable response ({exc})"
    return "verified", data.get("user", {}).get("username", "Unknown")


def verify_ids(
    discord_ids: list[str],
    opener: Callable = urllib.request.urlopen,
    sleep: Callable = time.sleep,
) -> dict:
    """Check every ID against the guild, printing progress as it goes.

    Args:
        discord_ids: IDs to look up.
        opener: Passed through to :func:`fetch_member`.
        sleep: Callable used for all waiting; replaceable for tests.

    Returns:
        A dict with ``"verified"`` (list of ``(id, username)``), ``"missing"``
        (list of ids) and ``"errors"`` (list of ``(id, reason)``).
    """
    verified = []
    missing = []
    errors = []
    total = len(discord_ids)

    for position, discord_id in enumerate(discord_ids, start=1):
        prefix = f"[{position}/{total}]"
        status, detail = fetch_member(discord_id, opener)

        retries = 0
        while status == "rate_limited" and retries < MAX_RATE_LIMIT_RETRIES:
            print(f"{prefix} Rate limited, waiting {detail}s...")
            sleep(detail + 0.5)
            retries += 1
            status, detail = fetch_member(discord_id, opener)
        if status == "rate_limited":
            # Still throttled after the last retry: record it as an error.
            status, detail = "error", 429

        suffix = " (after retry)" if retries else ""
        if status == "verified":
            verified.append((discord_id, detail))
            print(f"{prefix} ✓ {discord_id} - {detail}{suffix}")
        elif status == "missing":
            missing.append(discord_id)
            print(f"{prefix} ✗ {discord_id} - NOT IN SERVER{suffix}")
        else:
            reason = f"HTTP {detail}" if isinstance(detail, int) else detail
            errors.append((discord_id, reason))
            print(f"{prefix} ? {discord_id} - Error {detail}")

        # Small delay to avoid rate limits
        sleep(REQUEST_SPACING)

    return {"verified": verified, "missing": missing, "errors": errors}


def main() -> int:
    """Run the verification and write the JSON report.

    Returns:
        Process exit code: 0 on success, 1 when the bot token or the table
        header is missing.
    """
    if not BOT_TOKEN:
        print("DISCORD_BOT_TOKEN environment variable is not set!")
        return 1

    # Read Discord IDs from table.md
    content = (DATA_DIR / "table.md").read_text(encoding="utf-8")
    try:
        discord_ids = parse_discord_ids(content)
    except ValueError as exc:
        print(exc)
        return 1
    print(f"Found {len(discord_ids)} Discord IDs to verify")

    # Verify each ID against the guild
    results = verify_ids(discord_ids)

    print("\n=== SUMMARY ===")
    print(f"Verified: {len(results['verified'])}")
    print(f"Missing: {len(results['missing'])}")
    print(f"Errors: {len(results['errors'])}")

    # Save results
    with open(
        DATA_DIR / "discord_verification.json", "w", encoding="utf-8"
    ) as f:
        json.dump(results, f, indent=2)

    print("\nResults saved to discord_verification.json")
    return 0


if __name__ == "__main__":
    sys.exit(main())