bdsp-core
diff --git a/‎SETUP_GOOGLE_SHEETS_SYNC.md‎
Lines changed: 52 additions & 0 deletions b/‎SETUP_GOOGLE_SHEETS_SYNC.md‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎extract_team_simple.py‎
Lines changed: 100 additions & 0 deletions b/‎extract_team_simple.py‎
Lines changed: 100 additions & 0 deletions
diff --git a/‎extract_team_to_csv.py‎
Lines changed: 80 additions & 0 deletions b/‎extract_team_to_csv.py‎
Lines changed: 80 additions & 0 deletions
@@ -0,0 +1,52 @@
+# Google Sheets Team Sync Setup Guide
+
+## Using a Service Account (Recommended)
+
+### Step 1: Create Service Account
+1. Go to [Google Cloud Console](https://console.cloud.google.com/)
+2. Navigate to **IAM & Admin** → **Service Accounts**
+3. Click **+ CREATE SERVICE ACCOUNT**
+4. Name it something like "sheets-sync"
+5. Click **Create and Continue** (skip optional steps)
+6. Click **Done**
+
+### Step 2: Create and Download Key
+1. Click on your new service account
+2. Go to **Keys** tab
+3. Click **ADD KEY** → **Create new key**
+4. Choose **JSON** format
+5. Download the file and rename it to `service-account-key.json`
+6. Place it in your repository root. The file name is already listed in `.gitignore`; never commit this key.
+
+### Step 3: Get Service Account Email
+1. On the **Service Accounts** page, copy the service account's email address (it looks like `sheets-sync@your-project.iam.gserviceaccount.com`)
+
+### Step 4: Share Google Sheet
+1. Open your Google Sheet
+2. Click **Share** button
+3. Paste the service account email
+4. Give it **Viewer** access
+5. Click **Send**
+
+### Step 5: Run the Sync
+```bash
+cd /path/to/bdsp-core.github.io   # your local clone of the repository
+source venv/bin/activate
+python sync_team_service_account.py
+```
+
+## Google Sheet Format
+Your sheet should have these columns:
+- Name
+- Link (optional URL)
+- Photo (filename)
+- Position
+- Email
+- Education1
+- Education2
+- Education3
+- Education4
+- Category (must be one of: Faculty, Alumni, Postdocs/Students/Staff, Collaborators)
+
+## Automation with GitHub Actions
+Once the manual sync works, the GitHub Action will use the same service account to sync automatically.
@@ -0,0 +1,100 @@
+#!/usr/bin/env python3
+"""Extract team data from YAML files to CSV - simple version without dependencies."""
+
+import re
+import csv
+
+def parse_yaml_simple(filename):
+    """Parse a flat YAML list of team members without a YAML library.
+
+    Only the structure used by the team data files is understood: each
+    member starts with a ``- name: ...`` line at column 0, followed by
+    ``key: value`` lines indented by at least two spaces. Nested
+    structures, multi-line scalars and comments are not supported.
+
+    Args:
+        filename: Path of the YAML file to read.
+
+    Returns:
+        A list of dicts, one per member, mapping field names to string
+        values. The list is empty (and a warning is printed) when the
+        file does not exist.
+    """
+    members = []
+    current_member = {}
+
+    try:
+        # Read as UTF-8 explicitly: the CSV is written as UTF-8, and the
+        # platform default encoding can mangle non-ASCII names.
+        with open(filename, 'r', encoding='utf-8') as f:
+            for raw_line in f:
+                line = raw_line.rstrip()
+
+                # A new member starts with "- name:" at column 0.
+                if line.startswith('- name:'):
+                    if current_member:
+                        members.append(current_member)
+                    name_value = line[len('- name:'):].strip()
+                    current_member = {'name': _unquote_scalar(name_value)}
+
+                # Indented "key: value" lines belong to the current member.
+                elif line.startswith('  ') and ':' in line:
+                    # Split on the first colon only so values may contain ':'.
+                    key, value = line.strip().split(':', 1)
+                    current_member[key.strip()] = _unquote_scalar(value.strip())
+    except FileNotFoundError:
+        print(f"Warning: {filename} not found")
+
+    # Don't forget the last member
+    if current_member:
+        members.append(current_member)
+
+    return members
+
+
+def _unquote_scalar(value):
+    """Drop one pair of matching quotes wrapped around a YAML scalar.
+
+    Without this, a quoted value such as ``"photo.jpg"`` would reach the
+    CSV with its literal quote characters, and a quoted HTML anchor in
+    the name field would not be recognised as a link. Escape sequences
+    inside the quotes are not interpreted.
+    """
+    if len(value) >= 2 and value[0] == value[-1] and value[0] in ('"', "'"):
+        return value[1:-1]
+    return value
+
+def extract_link_and_name(name_field):
+    """Split a name field into a display name and an optional URL.
+
+    When the field begins with an ``<a href="...">text</a>``-style
+    anchor, the anchor text and its href are returned. Otherwise the
+    whole field is treated as the name and the link is empty.
+
+    Returns:
+        A ``(name, link)`` tuple of whitespace-stripped strings.
+    """
+    anchor = re.match(r'<a href="([^"]+)">([^<]+)</?a?/?>', name_field)
+    if anchor is None:
+        # Plain text: no link to report.
+        return name_field.strip(), ""
+    url, label = anchor.groups()
+    return label.strip(), url.strip()
+
+def main():
+    """Export every team member from the YAML data files to team_data.csv.
+
+    Each data file is parsed with ``parse_yaml_simple``, every member is
+    turned into one CSV row tagged with the file's category, and all
+    rows are written to ``team_data.csv`` in the current directory.
+    """
+    # NOTE(review): the setup guide spells the third category
+    # "Postdocs/Students/Staff" - confirm which spelling the sheet sync expects.
+    sources = [
+        ('_data/faculty.yml', 'Faculty'),
+        ('_data/postdocsStudentsStaff.yml', 'Postdocs, Students, Staff'),
+        ('_data/alumni.yml', 'Alumni'),
+        ('_data/collaborators.yml', 'Collaborators')
+    ]
+
+    # CSV column -> YAML key, for the fields that are copied over verbatim.
+    copied_fields = (
+        ('Photo', 'photo'),
+        ('Position', 'info'),
+        ('Email', 'email'),
+        ('Education1', 'education1'),
+        ('Education2', 'education2'),
+        ('Education3', 'education3'),
+        ('Education4', 'education4'),
+    )
+    columns = ['Name', 'Link', 'Photo', 'Position', 'Email',
+               'Education1', 'Education2', 'Education3', 'Education4', 'Category']
+
+    exported = []
+    for path, label in sources:
+        parsed = parse_yaml_simple(path)
+
+        for entry in parsed:
+            display_name, url = extract_link_and_name(entry.get('name', ''))
+            record = {'Name': display_name, 'Link': url}
+            record.update((column, entry.get(key, '')) for column, key in copied_fields)
+            record['Category'] = label
+            exported.append(record)
+
+        print(f"Extracted {len(parsed)} members from {path}")
+
+    # newline='' lets the csv module control line endings itself.
+    with open('team_data.csv', 'w', newline='', encoding='utf-8') as out:
+        sheet = csv.DictWriter(out, fieldnames=columns)
+        sheet.writeheader()
+        sheet.writerows(exported)
+
+    print(f"\nTotal: {len(exported)} team members exported to team_data.csv")
+    print("\nYou can now copy the contents of team_data.csv to your Google Sheet!")
+
+# Run the export only when executed as a script, not when imported.
+if __name__ == '__main__':
+    main()
@@ -0,0 +1,80 @@
+#!/usr/bin/env python3
+"""Extract team data from YAML files to CSV for Google Sheets import."""
+
+import yaml
+import csv
+import re
+
+def extract_link_and_name(name_field):
+    """Return ``(name, link)`` for a name field that may be an HTML anchor.
+
+    A field starting with ``<a href="URL">TEXT`` followed by a closing
+    tag yields ``(TEXT, URL)``. Any other field yields the field itself
+    and an empty link. Both parts are stripped of surrounding whitespace.
+    """
+    found = re.match(r'<a href="([^"]+)">([^<]+)</?a?/?>', name_field)
+    if not found:
+        # Not an anchor: the whole field is the name.
+        return name_field.strip(), ""
+    href = found.group(1)
+    text = found.group(2)
+    return text.strip(), href.strip()
+
+def yaml_to_rows(yaml_file, category):
+    """Load one team YAML file from ``_data/`` and convert it to CSV rows.
+
+    Args:
+        yaml_file: File name inside the ``_data`` directory.
+        category: Value written to the ``Category`` column of every row.
+
+    Returns:
+        A list of row dicts keyed by the CSV column names. The list is
+        empty when the file is missing (a warning is printed) or when it
+        contains no data.
+    """
+    path = f'_data/{yaml_file}'
+
+    try:
+        # Read as UTF-8 explicitly: the CSV is written as UTF-8, and the
+        # platform default encoding can mangle non-ASCII names.
+        with open(path, 'r', encoding='utf-8') as f:
+            data = yaml.safe_load(f)
+    except FileNotFoundError:
+        # Report the path that was actually opened, not just the file name.
+        print(f"Warning: {path} not found")
+        return []
+
+    rows = []
+    # An empty file loads as None; treat it as having no members.
+    for member in data or []:
+        # A "name:" key with no value loads as None, which re.match would
+        # reject with a TypeError, so fall back to an empty string.
+        name, link = extract_link_and_name(member.get('name') or '')
+
+        rows.append({
+            'Name': name,
+            'Link': link,
+            'Photo': member.get('photo', ''),
+            'Position': member.get('info', ''),
+            'Email': member.get('email', ''),
+            'Education1': member.get('education1', ''),
+            'Education2': member.get('education2', ''),
+            'Education3': member.get('education3', ''),
+            'Education4': member.get('education4', ''),
+            'Category': category
+        })
+
+    return rows
+
+def main():
+    """Collect the rows of every team YAML file and write team_data.csv.
+
+    Each file is converted with ``yaml_to_rows``; the combined rows are
+    written, with a header, to ``team_data.csv`` in the current directory.
+    """
+    columns = ['Name', 'Link', 'Photo', 'Position', 'Email',
+               'Education1', 'Education2', 'Education3', 'Education4', 'Category']
+
+    # NOTE(review): the setup guide spells the second category
+    # "Postdocs/Students/Staff" - confirm which spelling the sheet sync expects.
+    sources = (
+        ('faculty.yml', 'Faculty'),
+        ('postdocsStudentsStaff.yml', 'Postdocs, Students, Staff'),
+        ('alumni.yml', 'Alumni'),
+        ('collaborators.yml', 'Collaborators'),
+    )
+
+    collected = []
+    for file_name, label in sources:
+        batch = yaml_to_rows(file_name, label)
+        collected += batch
+        print(f"Extracted {len(batch)} members from {file_name}")
+
+    # newline='' lets the csv module control line endings itself.
+    with open('team_data.csv', 'w', newline='', encoding='utf-8') as out:
+        sheet = csv.DictWriter(out, fieldnames=columns)
+        sheet.writeheader()
+        sheet.writerows(collected)
+
+    print(f"\nTotal: {len(collected)} team members exported to team_data.csv")
+
+# Run the export only when executed as a script, not when imported.
+if __name__ == '__main__':
+    main()