Skip to content
Merged
Show file tree
Hide file tree
Changes from 6 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 3 additions & 3 deletions .agents/plugins/marketplace.json
Original file line number Diff line number Diff line change
@@ -1,11 +1,11 @@
{
"name": "data-cloud-ai-dev-kit-marketplace",
"name": "data-agent-kit-starter-pack-marketplace",
"interface": {
"displayName": "data-cloud-ai-dev-kit Marketplace"
"displayName": "Data Agent Kit Starter Pack Marketplace"
},
"plugins": [
{
"name": "data-cloud-ai-dev-kit",
"name": "data-agent-kit-starter-pack",
"source": {
"source": "local",
"path": "./"
Expand Down
4 changes: 2 additions & 2 deletions .claude-plugin/marketplace.json
Original file line number Diff line number Diff line change
@@ -1,11 +1,11 @@
{
"name": "data-cloud-ai-dev-kit-marketplace",
"name": "data-agent-kit-starter-pack-marketplace",
"owner": {
"name": "Google LLC"
},
"plugins": [
{
"name": "data-cloud-ai-dev-kit",
"name": "data-agent-kit-starter-pack",
"source": "./",
"description": "This plugin provides a specialized suite of skills for data engineers and database practitioners working on Google Cloud. It acts as an expert assistant, allowing you to use natural language prompts in your preferred coding agent to architect complex data pipelines, transform data with dbt, write Spark and BigQuery SQL notebooks, and orchestrate end-to-end workflows across GCP's data ecosystem."
}
Expand Down
2 changes: 1 addition & 1 deletion .claude-plugin/plugin.json
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
{
"name": "data-cloud-ai-dev-kit",
"name": "data-agent-kit-starter-pack",
"version": "0.1.8",
"description": "This plugin provides a specialized suite of skills for data engineers and database practitioners working on Google Cloud. It acts as an expert assistant, allowing you to use natural language prompts in your preferred coding agent to architect complex data pipelines, transform data with dbt, write Spark and BigQuery SQL notebooks, and orchestrate end-to-end workflows across GCP's data ecosystem.",
"mcp": "./.mcp.json"
Expand Down
6 changes: 3 additions & 3 deletions .codex-plugin/plugin.json
Original file line number Diff line number Diff line change
@@ -1,11 +1,11 @@
{
"name": "data-cloud-ai-dev-kit",
"name": "data-agent-kit-starter-pack",
"version": "0.1.8",
"description": "This plugin provides a specialized suite of skills for data engineers and database practitioners working on Google Cloud. It acts as an expert assistant, allowing you to use natural language prompts in your preferred coding agent to architect complex data pipelines, transform data with dbt, write Spark and BigQuery SQL notebooks, and orchestrate end-to-end workflows across GCP's data ecosystem.",
"skills": "./skills/",
"interface": {
"displayName": "Data Cloud AI Dev Kit",
"shortDescription": "Data Cloud AI Dev Kit",
"displayName": "Data Agent Kit Starter Pack",
"shortDescription": "Data Agent Kit Starter Pack",
"category": "Productivity"
},
"mcp": "./.mcp.json"
Expand Down
1 change: 1 addition & 0 deletions .lycheeignore
Original file line number Diff line number Diff line change
@@ -1,4 +1,5 @@
https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit/compare/
https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit
https://raw.githubusercontent.com/gemini-cli-extensions/data-cloud-ai-dev-kit/main/codex-install.sh
https://docs.cloud.google.com/data-cloud-extension/vs-code/install
data-cloud-ai-dev-kit@data-cloud-ai-dev-kit-marketplace
20 changes: 10 additions & 10 deletions .mcp.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
"command": "npx",
"args": [
"-y",
"git+https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit.git"
"git+https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack.git"
],
"env": {},
"env_vars": [
Expand All @@ -20,7 +20,7 @@
"bigquery",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"BIGQUERY_LOCATION": "",
Expand All @@ -36,7 +36,7 @@
"spanner",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"SPANNER_DATABASE": "",
Expand All @@ -54,7 +54,7 @@
"alloydb-postgres-admin",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {}
},
Expand All @@ -67,7 +67,7 @@
"alloydb-postgres",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
Comment thread
belluru marked this conversation as resolved.
"env": {
"ALLOYDB_POSTGRES_CLUSTER": "",
Expand All @@ -89,7 +89,7 @@
"cloud-sql-postgres-admin",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {}
},
Expand All @@ -102,7 +102,7 @@
"cloud-sql-postgres",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"CLOUD_SQL_POSTGRES_DATABASE": "",
Expand All @@ -123,7 +123,7 @@
"dataplex",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"DATAPLEX_PROJECT": ""
Expand All @@ -138,7 +138,7 @@
"dataproc",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"DATAPROC_PROJECT": "",
Expand All @@ -154,7 +154,7 @@
"serverless-spark",
"--stdio",
"--user-agent-metadata",
"google-cloud-data-agent-kit-claude-and-codex"
"datacloud.claude-and-codex"
],
"env": {
"SERVERLESS_SPARK_PROJECT": "",
Expand Down
8 changes: 4 additions & 4 deletions DEVELOPER.md
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
# DEVELOPER.md

This document provides instructions for setting up your development environment
and contributing to the Cloud SQL for PostgreSQL Gemini CLI Extension project.
and contributing to the Data Agent Kit Starter Pack project.

## Prerequisites

Expand All @@ -22,8 +22,8 @@ The core logic for this extension is handled by a pre-built `toolbox` binary. Th
1. **Clone the Repository:**

```bash
git clone https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit.git
cd data-cloud-ai-dev-kit
git clone https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack.git
cd data-agent-kit-starter-pack
```

2. **Download the Toolbox Binary:** The required version of the `toolbox` binary
Expand All @@ -48,7 +48,7 @@ The core logic for this extension is handled by a pre-built `toolbox` binary. Th
The CLI will prompt you to confirm the installation. Accept it to proceed.

4. **Testing Changes:** After installation, start the Gemini CLI (`gemini`).
You can now interact with the `data-cloud-ai-dev-kit` tools to manually test your changes
You can now interact with the `data-agent-kit-starter-pack` tools to manually test your changes
against your connected database.

### Adding or Updating Skills
Expand Down
119 changes: 93 additions & 26 deletions README.md
Original file line number Diff line number Diff line change
@@ -1,49 +1,115 @@
# Data Cloud AI Dev Kit
# Data Agent Kit Starter Pack

> [!NOTE]
> This extension is currently in beta (pre-v1.0), and may see breaking changes until the first stable release (v1.0).

This plugin provides a specialized suite of skills and MCP tools for data engineers and database practitioners working on Google Cloud. It acts as an expert assistant, allowing you to use natural language prompts in your preferred coding agent to architect complex data pipelines, transform data with dbt, write Spark and BigQuery SQL notebooks, and orchestrate end-to-end workflows across GCP's data ecosystem (BigQuery, Spanner, BigLake, Dataproc, etc.).
This plugin provides a specialized suite of skills and MCP tools for data engineers and database practitioners working on Google Cloud. It acts as an expert assistant, allowing you to use natural language prompts in your preferred coding agent to architect complex data pipelines, transform data with dbt, write Spark and BigQuery SQL notebooks, and orchestrate end-to-end workflows across the Google Cloud data ecosystem (BigQuery, Spanner, BigLake, Dataproc, etc.).

> [!IMPORTANT]
> **We Want Your Feedback!**
> Please share your thoughts with us by opening an issue on GitHub. Your input is invaluable and helps us improve the project for everyone.

## Why Use the Data Cloud AI Dev Kit?
## Why Use the Data Agent Kit Starter Pack?

* **Seamless Workflow:** Brings Google Cloud data engineering expertise directly into your terminal or IDE via Gemini CLI, Claude Code, or Codex.
* **End-to-End Data Pipelines:** Effortlessly generate code that reads raw data from GCS, processes it with Spark or BigQuery, transforms it through medallion architectures (bronze, silver, gold) using dbt, and exports it to serving layers like Cloud Spanner.
* **Ecosystem Integration:** Work across boundaries—generate BigLake Iceberg catalog tables, train BigQuery ML models (XGBoost, KMEANS), and create interactive Streamlit dashboards or LookML models all from natural language.
* **Seamless Workflow:** Bring Google Cloud data engineering expertise directly into your terminal or IDE via Gemini CLI, Claude Code, or Codex.
* **End-to-End Data Pipelines:** Effortlessly generate code that reads raw data from Cloud Storage, processes it with Spark or BigQuery, transforms it through medallion architectures (bronze, silver, gold) using dbt, and exports it to serving layers like Spanner.
* **Ecosystem Integration:** Work across boundaries—generate BigLake Iceberg catalog tables, train BigQuery ML models (XGBoost, KMEANS), and create interactive Streamlit dashboards or LookML models, all from natural language.
* **Workflow Orchestration:** Automatically create and schedule orchestration pipelines that tie your notebooks and dbt models together into robust, scheduled jobs.

## Prerequisites

Ensure you have one of the following coding agents installed:
* [Gemini CLI](https://github.com/google-gemini/gemini-cli) (v0.6.0+)
* [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview)
* Codex CLI
Ensure you have the following installed:
* **Node.js and npm** (Latest version recommended)
* One of the following coding agents:
* [Gemini CLI](https://github.com/google-gemini/gemini-cli) (v0.6.0+)
* [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview)
* Codex CLI
* **(Optional) IDE Extension:** [Google Cloud Data Agent Kit](https://docs.cloud.google.com/data-cloud-extension/vs-code/install).

## Getting Started

### Installation

Choose the installation method for your preferred coding agent.
Choose the installation method for your preferred coding agent. Run the commands in your terminal.

#### Gemini CLI
<details>
<summary><b>Gemini CLI and Gemini Code Assist</b></summary>

```bash
gemini extensions install https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack
```
</details>

<details>
<summary><b>Claude Code</b></summary>

Run the `claude` command to start the agent, then run:

```bash
/plugin marketplace add https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack
/plugin install data-agent-kit-starter-pack@data-agent-kit-starter-pack-marketplace
```
</details>

<details>
<summary><b>Codex</b></summary>

Run the following commands in your terminal:

**macOS / Linux:**
```bash
gemini extensions install https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit
curl -sSL https://raw.githubusercontent.com/gemini-cli-extensions/data-agent-kit-starter-pack/main/codex-install.sh | bash
```

#### Claude Code
**Windows:**
```powershell
irm https://raw.githubusercontent.com/gemini-cli-extensions/data-agent-kit-starter-pack/main/codex-install.ps1 | iex
```

After running the installation script, run the `codex` command to start the agent, then run:

```bash
/plugin marketplace add https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit
/plugin install data-cloud-ai-dev-kit@data-cloud-ai-dev-kit-marketplace
/plugins
```

#### Codex (One-Liner)
Use the interactive options to install the extension with the name `Data Agent Kit Starter Pack`.
</details>

### Configuration

MCP toolboxes are added to the respective agent configuration files. You must configure the MCP toolboxes in your agent's configuration files for them to start successfully.

In all cases, you must restart the agent after updating the configuration files.

<details>
<summary><b>Gemini CLI and Gemini Code Assist</b></summary>

Edit the configuration file:
`~/.gemini/extensions/data-agent-kit-starter-pack/gemini-extension.json`
</details>

<details>
<summary><b>Claude Code</b></summary>

1. Edit the configuration file:
`~/.claude/plugins/cache/data-agent-kit-starter-pack-marketplace/data-agent-kit-starter-pack/<version>/.mcp.json`

2. Reinstall the plugin:
Run `/plugin` and use the interactive options to uninstall `data-agent-kit-starter-pack`. Then run `/plugin install` to add it back.
</details>

<details>
<summary><b>Codex</b></summary>

1. Edit the configuration file:
`~/.agents/plugins/data-agent-kit-starter-pack/.mcp.json`

2. Use interactive options to uninstall and install the extension:
```bash
curl -sSL https://raw.githubusercontent.com/gemini-cli-extensions/data-cloud-ai-dev-kit/main/codex-install.sh | bash
/plugins
```
Install with name: `Data Agent Kit Starter Pack`
</details>

## Usage Examples

Expand All @@ -67,14 +133,15 @@ Interact with your coding agent using natural language prompts to perform comple

* **Plugin Not Found:** Ensure you have restarted your agent (e.g., Gemini CLI or Codex) after installation.
* **Authentication Errors:** Many GCP skills require an active authenticated session. Ensure you have run `gcloud auth login` and `gcloud auth application-default login` on your machine.
* **MCP Connection Issues:** Update the MCP server configuration values (such as project and region) that the MCP toolboxes need in order to connect successfully.

## Security Reminder: Agent Environment Hardening

Your agent has the power to
execute tools and commands on your behalf. Protect your GCP resources by
enforcing **Strict Least Privilege** across all CLIs, MCP servers and other
resources available to your agents. For example, use scoped Service Accounts
(read more
[here](https://docs.cloud.google.com/docs/authentication/use-service-account-impersonation))
for tasks accessing your cloud resources and conducting regular permission and
agent settings audits to minimize your attack surface.
Your agent has the power to execute tools and commands on your behalf. Protect your GCP resources by enforcing **Strict Least Privilege** across all CLIs, MCP servers and other resources available to your agents.

* Use [service accounts](https://docs.cloud.google.com/docs/authentication/use-service-account-impersonation) for accessing your cloud resources.
* Assign the service account a role with [limited permissions](https://docs.cloud.google.com/iam/docs/roles-overview).
* Prevent unwanted cross-org agent access by utilizing **Principal Access Boundaries** to scope your agent to [projects](https://docs.cloud.google.com/iam/docs/principal-access-boundary-policies#use-case-one-project) you intend the agent to access.

> [!NOTE]
> The Principal Access Boundary condition should bind the policy to the service accounts you intend to restrict.
6 changes: 3 additions & 3 deletions codex-install.ps1
Original file line number Diff line number Diff line change
Expand Up @@ -14,8 +14,8 @@

$ErrorActionPreference = "Stop"

$pluginName = "data-cloud-ai-dev-kit"
$repoUrl = "https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit"
$pluginName = "data-agent-kit-starter-pack"
$repoUrl = "https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack"
$pluginsRoot = Join-Path $HOME ".agents\plugins"
$installDir = Join-Path $pluginsRoot $pluginName
$marketplaceFile = Join-Path $pluginsRoot "marketplace.json"
Expand Down Expand Up @@ -85,7 +85,7 @@ $pluginJson = @"
{
"name": "$pluginName",
"interface": {
"displayName": "Google Data Cloud AI Dev Kit"
"displayName": "Data Agent Kit Starter Pack"
},
"source": {
"source": "local",
Expand Down
6 changes: 3 additions & 3 deletions codex-install.sh
Original file line number Diff line number Diff line change
Expand Up @@ -15,8 +15,8 @@

set -e

PLUGIN_NAME="data-cloud-ai-dev-kit"
REPO_URL="https://github.com/gemini-cli-extensions/data-cloud-ai-dev-kit"
PLUGIN_NAME="data-agent-kit-starter-pack"
REPO_URL="https://github.com/gemini-cli-extensions/data-agent-kit-starter-pack"
INSTALL_DIR="$HOME/.agents/plugins/$PLUGIN_NAME"
MARKETPLACE_FILE="$HOME/.agents/plugins/marketplace.json"

Expand Down Expand Up @@ -53,7 +53,7 @@ data.plugins = data.plugins || [];
data.plugins = data.plugins.filter(p => p.name !== '${PLUGIN_NAME}');
data.plugins.push({
name: '${PLUGIN_NAME}',
interface: { displayName: 'Google Data Cloud AI Dev Kit' },
interface: { displayName: 'Data Agent Kit Starter Pack' },
source: { source: 'local', path: './.agents/plugins/${PLUGIN_NAME}' },
policy: { installation: 'AVAILABLE', authentication: 'ON_INSTALL' },
category: 'Productivity'
Expand Down
Loading
Loading