-
Notifications
You must be signed in to change notification settings - Fork 259
Expand file tree
/
Copy pathgit.ts
More file actions
457 lines (412 loc) · 13.7 KB
/
git.ts
File metadata and controls
457 lines (412 loc) · 13.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
import { env, createLogger } from "@sourcebot/shared";
import { existsSync } from 'node:fs';
import { mkdir } from 'node:fs/promises';
import { dirname, resolve } from 'node:path';
import { CheckRepoActions, GitConfigScope, simpleGit, SimpleGitProgressEvent } from 'simple-git';
/** Signature of the optional callback that receives simple-git progress events. */
type onProgressFn = (event: SimpleGitProgressEvent) => void;
// Module-level logger, created under the 'git-utils' name.
const logger = createLogger('git-utils');
/**
 * Builds a simple-git client whose working directory is `path`.
 *
 * @param path - Directory to run git commands in; must already exist.
 * @param onProgress - Optional handler forwarded to simple-git as its `progress` option.
 * @param signal - Optional abort signal forwarded to simple-git as its `abort` option.
 * @returns The configured simple-git client.
 * @throws Error when `path` does not exist.
 */
const createGitClientForPath = (path: string, onProgress?: onProgressFn, signal?: AbortSignal) => {
    if (!existsSync(path)) {
        throw new Error(`Path ${path} does not exist`);
    }

    const gitEnvironment = {
        ...process.env,
        /**
         * @note Background on why this is needed: a `git clone` was observed to
         * fail without throwing, after which a follow-up `git config` ran outside
         * of any git directory. Git then walked up the directory tree until it
         * either found some other git directory (development env) or hit a
         * GIT_DISCOVERY_ACROSS_FILESYSTEM error at a filesystem boundary (prod).
         * GIT_CEILING_DIRECTORIES caps that walk at the parent directory.
         */
        GIT_CEILING_DIRECTORIES: resolve(dirname(path)),
        /**
         * Turn off credential prompts so that git operations fail immediately
         * when credentials are missing instead of waiting for input.
         */
        GIT_TERMINAL_PROMPT: '0',
    };

    const client = simpleGit({
        progress: onProgress,
        abort: signal,
    });

    return client.env(gitEnvironment).cwd({ path });
}
/**
 * Bare-clones `cloneUrl` into `path` (creating the directory if needed), then
 * scrubs connection details from the new repository's config and writes a
 * commit-graph.
 *
 * @param cloneUrl - Remote URL to clone from.
 * @param authHeader - Optional HTTP header supplied to the clone via `http.extraHeader`.
 * @param path - Destination directory of the bare repository.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 * @throws Error with a message that omits the underlying git error unless
 * SOURCEBOT_LOG_LEVEL is "debug" (the remote URL may contain credentials).
 */
export const cloneRepository = async (
    {
        cloneUrl,
        authHeader,
        path,
        onProgress,
        signal,
    }: {
        cloneUrl: string,
        authHeader?: string,
        path: string,
        onProgress?: onProgressFn,
        signal?: AbortSignal
    }
) => {
    try {
        await mkdir(path, { recursive: true });

        const git = createGitClientForPath(path, onProgress, signal);

        const cloneArgs = [
            "--bare",
            ...(authHeader ? ["-c", `http.extraHeader=${authHeader}`] : [])
        ];

        await git.clone(cloneUrl, path, cloneArgs);

        // `git clone -c key=value` writes the value into the new repository's
        // config, so the auth header would otherwise stay on disk. Remove it,
        // mirroring what fetchRepository does after each fetch. The repository
        // was just created, so every value of this key came from the clone.
        if (authHeader) {
            await git.raw(["config", "--unset-all", "http.extraHeader"]);
        }

        await unsetGitConfig({
            path,
            keys: ["remote.origin.url"],
            signal,
        });

        // @note: operations that need to iterate over a lot of commits (e.g., rev-list --count)
        // can be slow on larger repositories. Commit graphs are an acceleration structure that
        // speeds up these operations.
        // @see: https://git-scm.com/docs/commit-graph
        await writeCommitGraph({ path, signal });
    } catch (error: unknown) {
        const baseLog = `Failed to clone repository: ${path}`;

        if (env.SOURCEBOT_LOG_LEVEL !== "debug") {
            // Avoid printing the remote URL (that may contain credentials) to logs by default.
            throw new Error(`${baseLog}. Set environment variable SOURCEBOT_LOG_LEVEL=debug to see the full error message.`);
        } else if (error instanceof Error) {
            throw new Error(`${baseLog}. Reason: ${error.message}`);
        } else {
            throw new Error(`${baseLog}. Error: ${error}`);
        }
    }
};
/**
 * Fetches all branch heads from `cloneUrl` into the repository at `path`
 * (pruning deleted branches and refreshing the commit-graph), then points HEAD
 * at the remote's default branch when it can be determined.
 *
 * When `authHeader` is given it is written to `http.extraHeader` for the
 * duration of the fetch and removed again afterwards, whether or not the
 * fetch succeeded.
 *
 * @param cloneUrl - Remote URL to fetch from.
 * @param authHeader - Optional HTTP header used to authenticate the fetch.
 * @param path - Path of the local repository.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 * @throws Error with a message that omits the underlying git error unless
 * SOURCEBOT_LOG_LEVEL is "debug" (it may contain credentials).
 */
export const fetchRepository = async (
    {
        cloneUrl,
        authHeader,
        path,
        onProgress,
        signal,
    }: {
        cloneUrl: string,
        authHeader?: string,
        path: string,
        onProgress?: onProgressFn,
        signal?: AbortSignal
    }
) => {
    const git = createGitClientForPath(path, onProgress, signal);

    // Single place that turns any failure into the error reported to callers,
    // so that cleanup failures follow the same credential-hiding policy.
    const toReportedError = (error: unknown): Error => {
        const baseLog = `Failed to fetch repository: ${path}`;
        if (env.SOURCEBOT_LOG_LEVEL !== "debug") {
            // Avoid printing the remote URL (that may contain credentials) to logs by default.
            return new Error(`${baseLog}. Set environment variable SOURCEBOT_LOG_LEVEL=debug to see the full error message.`);
        } else if (error instanceof Error) {
            return new Error(`${baseLog}. Reason: ${error.message}`);
        } else {
            return new Error(`${baseLog}. Error: ${error}`);
        }
    };

    let failure: Error | undefined;

    try {
        if (authHeader) {
            await git.addConfig("http.extraHeader", authHeader);
        }

        await git.fetch([
            cloneUrl,
            "+refs/heads/*:refs/heads/*",
            "--prune",
            "--progress",
            // On fetch, ensure the commit graph is up to date.
            // @see: https://git-scm.com/docs/commit-graph
            "--write-commit-graph"
        ]);

        // Update HEAD to match the remote's default branch. This handles the case where the remote's
        // default branch changes.
        const remoteDefaultBranch = await getRemoteDefaultBranch({
            path,
            cloneUrl,
        });
        if (remoteDefaultBranch) {
            await git.raw(['symbolic-ref', 'HEAD', `refs/heads/${remoteDefaultBranch}`]);
        }
    } catch (error: unknown) {
        failure = toReportedError(error);
    }

    if (authHeader) {
        try {
            // The last argument of `git config --unset` is a regular expression,
            // not a literal. Escape the regex metacharacters (base64 credentials
            // routinely contain `+`) so the header is matched verbatim, and
            // neutralize a leading `!`, which git would read as "negate".
            const escaped = authHeader.replace(/[\\^$.*+?()|[{]/g, '\\$&');
            const valuePattern = escaped.startsWith('!') ? `[!]${escaped.slice(1)}` : escaped;
            await git.raw(["config", "--unset", "http.extraHeader", valuePattern]);
        } catch (error: unknown) {
            // Never let a cleanup failure replace the primary failure, and never
            // surface the raw git error (it can echo the header back).
            if (!failure) {
                failure = toReportedError(error);
            }
        }
    }

    if (failure) {
        throw failure;
    }
}
/**
 * Writes every entry of `gitConfig` into the config of the repo at `path`.
 * Keys that already exist have their value overridden and keys that are new
 * are added. Keys that exist in the repo but are absent from `gitConfig` are
 * left untouched.
 *
 * @param path - Path of the repository.
 * @param gitConfig - Map of config key to value.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 * @throws Error prefixed with "Failed to set git config" when a write fails.
 */
export const upsertGitConfig = async (
    {
        path,
        gitConfig,
        onProgress,
        signal,
    }: {
        path: string,
        gitConfig: Record<string, string>,
        onProgress?: onProgressFn,
        signal?: AbortSignal
    }) => {
    const git = createGitClientForPath(path, onProgress, signal);

    try {
        const entries = Object.entries(gitConfig);
        // Entries are written one after another, never concurrently.
        for (const [configKey, configValue] of entries) {
            await git.addConfig(configKey, configValue);
        }
    } catch (error: unknown) {
        const reason = error instanceof Error ? error.message : error;
        throw new Error(`Failed to set git config ${path}: ${reason}`);
    }
}
/**
 * Unsets the specified keys in the git config for the repo at the given path.
 * If a key is not set, this is a no-op.
 *
 * Keys are matched the way git matches them: the section and the variable name
 * are case-insensitive, while a subsection (the middle part of
 * `section.subsection.variable`) is case-sensitive.
 *
 * @param path - Path of the repository.
 * @param keys - Config keys to remove.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 * @throws Error prefixed with "Failed to unset git config" when listing or unsetting fails.
 */
export const unsetGitConfig = async (
    {
        path,
        keys,
        onProgress,
        signal,
    }: {
        path: string,
        keys: string[],
        onProgress?: onProgressFn,
        signal?: AbortSignal
    }) => {
    const git = createGitClientForPath(path, onProgress, signal);

    // Lower-cases the section and variable name and keeps any subsection as-is,
    // which is the form git uses when it lists config keys.
    const canonicalizeKey = (key: string): string => {
        const firstDot = key.indexOf('.');
        if (firstDot === -1) {
            return key.toLowerCase();
        }
        const lastDot = key.lastIndexOf('.');
        const section = key.slice(0, firstDot).toLowerCase();
        const subsection = key.slice(firstDot, lastDot); // empty, or ".<subsection>"
        const variable = key.slice(lastDot + 1).toLowerCase();
        return `${section}${subsection}.${variable}`;
    };

    try {
        const configList = await git.listConfig();
        const setKeys = new Set(Object.keys(configList.all).map(canonicalizeKey));

        for (const key of keys) {
            // Without this check, `git config --unset` on a missing key would fail.
            if (setKeys.has(canonicalizeKey(key))) {
                await git.raw(['config', '--unset', key]);
            }
        }
    } catch (error: unknown) {
        if (error instanceof Error) {
            throw new Error(`Failed to unset git config ${path}: ${error.message}`);
        } else {
            throw new Error(`Failed to unset git config ${path}: ${error}`);
        }
    }
}
/**
 * Returns true if `path` is the _root_ of a git repository.
 *
 * @param path - Directory to check. A path that does not exist yields `false`.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 * @returns Whether `path` is a repository root.
 * @throws Error prefixed with "isPathAGitRepoRoot failed" when the check itself fails.
 */
export const isPathAValidGitRepoRoot = async ({
    path,
    onProgress,
    signal,
}: {
    path: string,
    onProgress?: onProgressFn,
    signal?: AbortSignal
}) => {
    if (!existsSync(path)) {
        return false;
    }

    const git = createGitClientForPath(path, onProgress, signal);

    try {
        // `await` is required here: returning the pending promise would leave
        // the try block before it settles, so a rejection would skip the catch
        // below and reach the caller unwrapped.
        return await git.checkIsRepo(CheckRepoActions.IS_REPO_ROOT);
    } catch (error: unknown) {
        if (error instanceof Error) {
            throw new Error(`isPathAGitRepoRoot failed: ${error.message}`);
        } else {
            throw new Error(`isPathAGitRepoRoot failed: ${error}`);
        }
    }
}
/**
 * Checks whether `url` points at a git repository by listing its remote heads.
 *
 * @param url - Remote URL to probe.
 * @returns `true` when the listing succeeds and is non-empty; `false` when it
 * is empty or the listing throws.
 */
export const isUrlAValidGitRepo = async (url: string) => {
    const client = simpleGit();

    try {
        const remoteHeads = await client.listRemote(['--heads', url]);
        const hasAnyHead = remoteHeads.trim() !== '';
        return hasAnyHead;
    } catch {
        // Any failure while listing is treated as "not a valid git repo".
        return false;
    }
}
/**
 * Reads `remote.origin.url` from the local config of the repo at `path`.
 *
 * @param path - Path of the repository.
 * @returns The `value` reported by the config lookup.
 * @throws Error prefixed with "Failed to get origin for" when the lookup fails.
 */
export const getOriginUrl = async (path: string) => {
    const git = createGitClientForPath(path);

    try {
        const { value } = await git.getConfig('remote.origin.url', GitConfigScope.local);
        return value;
    } catch (error: unknown) {
        const reason = error instanceof Error ? error.message : error;
        throw new Error(`Failed to get origin for ${path}: ${reason}`);
    }
}
/**
 * Lists the branches of the repo at `path`.
 *
 * @param path - Path of the repository.
 * @returns The `all` list from simple-git's branch summary.
 */
export const getBranches = async (path: string) => {
    const { all } = await createGitClientForPath(path).branch();
    return all;
}
/**
 * Lists the tags of the repo at `path`.
 *
 * @param path - Path of the repository.
 * @returns The `all` list from simple-git's tag result.
 */
export const getTags = async (path: string) => {
    const { all } = await createGitClientForPath(path).tags();
    return all;
}
/**
 * Resolves `refName` to the commit it ultimately points at.
 *
 * @param path - Path of the repository.
 * @param refName - Ref to resolve.
 * @returns The rev-parse output, or `undefined` when resolution fails.
 */
export const getCommitHashForRefName = async ({
    path,
    refName,
}: {
    path: string,
    refName: string,
}) => {
    const git = createGitClientForPath(path);

    // Appending `^{commit}` fully dereferences the ref down to a commit hash.
    const commitSpec = `${refName}^{commit}`;

    try {
        return await git.revparse(commitSpec);
    } catch (error: unknown) {
        // @note: resolution was seen to fail on empty repositories, so the
        // error is logged and `undefined` is returned instead of rethrowing.
        logger.debug(error);
        return undefined;
    }
}
/**
 * Gets the default branch name from the remote repository by querying what
 * the remote's HEAD symbolic ref points to.
 *
 * This is useful for detecting when a remote repository's default branch has
 * changed (e.g., from "master" to "main").
 *
 * @param path - Path of the local repository the query is run from.
 * @param cloneUrl - Remote URL to query.
 * @returns The branch name (e.g., "main", "master") or undefined if it cannot be determined
 */
export const getRemoteDefaultBranch = async ({
    path,
    cloneUrl,
}: {
    path: string,
    cloneUrl: string,
}): Promise<string | undefined> => {
    const git = createGitClientForPath(path);

    try {
        const remoteHead = await git.raw(['ls-remote', '--symref', cloneUrl, 'HEAD']);
        // Looks for a line of the form "ref: refs/heads/<branch>\tHEAD".
        const match = remoteHead.match(/^ref: refs\/heads\/(\S+)\s+HEAD/m);
        // No symref line means the default branch cannot be determined.
        return match ? match[1] : undefined;
    } catch (error: unknown) {
        // Avoid printing error here since cloneUrl may contain credentials.
        logger.error(`Failed to get remote default branch for repository: ${path}`);
        return undefined;
    }
}
/**
 * Gets the branch name that the local HEAD symbolic ref points to.
 *
 * In a git repository, HEAD is typically a symbolic reference that points to
 * a branch (e.g., refs/heads/main). This function resolves that symbolic ref
 * and returns just the branch name.
 *
 * @param path - Path of the repository.
 * @returns The branch name (e.g., "main", "master") or undefined if HEAD is not a symbolic ref
 */
export const getLocalDefaultBranch = async ({
    path,
}: {
    path: string,
}): Promise<string | undefined> => {
    const git = createGitClientForPath(path);

    try {
        const ref = await git.raw(['symbolic-ref', 'HEAD']);
        // Returns something like "refs/heads/main\n", so trim and remove prefix
        const match = ref.trim().match(/^refs\/heads\/(.+)$/);
        // A HEAD that does not point under refs/heads/ yields undefined.
        return match ? match[1] : undefined;
    } catch (error: unknown) {
        logger.error(`Failed to get local default branch for repository: ${path}`);
        return undefined;
    }
}
/**
 * Looks up the author date of the most recent commit across all branches.
 *
 * @param path - Path of the repository.
 * @returns That date, or undefined when the repository is empty, the date
 * cannot be parsed, or git reports an error.
 */
export const getLatestCommitTimestamp = async ({
    path,
}: {
    path: string,
}): Promise<Date | undefined> => {
    const git = createGitClientForPath(path);

    try {
        // `git log --all -1 --format=%aI` prints the author date of the newest
        // commit on any branch, formatted as ISO 8601.
        const isoDate = (await git.raw(['log', '--all', '-1', '--format=%aI'])).trim();

        // No output at all means the repository has no commits.
        if (isoDate.length === 0) {
            return undefined;
        }

        const parsed = new Date(isoDate);
        if (Number.isNaN(parsed.getTime())) {
            logger.warn(`Failed to parse commit timestamp: ${isoDate}`);
            return undefined;
        }

        return parsed;
    } catch (error) {
        logger.debug(`Failed to get latest commit timestamp for ${path}:`, error);
        return undefined;
    }
}
/**
 * Reports whether the git repository at `path` has no commits.
 *
 * @param path - Path of the repository.
 * @returns `true` when `git log --all -1` prints nothing or the command fails;
 * `false` otherwise.
 */
export const isRepoEmpty = async ({
    path,
}: {
    path: string,
}): Promise<boolean> => {
    const git = createGitClientForPath(path);

    try {
        const newestCommitHash = await git.raw(['log', '--all', '-1', '--format=%H']);
        return newestCommitHash.trim().length === 0;
    } catch {
        // A failing `git log` is reported as an empty repository.
        return true;
    }
}
/**
 * Creates or refreshes the repository's commit-graph file, which
 * pre-computes commit metadata so that operations such as
 * rev-list --count, log, and merge-base run faster.
 *
 * @param path - Path of the repository.
 * @param onProgress - Optional progress callback forwarded to the git client.
 * @param signal - Optional abort signal forwarded to the git client.
 */
export const writeCommitGraph = async ({
    path,
    onProgress,
    signal,
}: {
    path: string,
    onProgress?: onProgressFn,
    signal?: AbortSignal,
}): Promise<void> => {
    const git = createGitClientForPath(path, onProgress, signal);
    const commitGraphArgs = ['commit-graph', 'write', '--reachable'];

    try {
        await git.raw(commitGraphArgs);
    } catch (error) {
        // This is purely a performance optimization, so a failure is logged
        // rather than rethrown.
        logger.debug(`Failed to write commit-graph for ${path}:`, error);
    }
}