-
Notifications
You must be signed in to change notification settings - Fork 0
/
dev-count-analysis.ts
240 lines (214 loc) · 7.22 KB
/
dev-count-analysis.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
/**
* This is to count the number of "contributing" developers using Snyk on a given repo.
* "Contributing" is defined as having contributed a commit in the last 90 days.
* This is use only on the `snyk monitor` command as that is used to monitor a project's dependencies in an
* on-going manner.
* It collects only a hash of the email of a git user and the most recent commit timestamp (both per the `git log`
* output) and can be disabled by config (see https://snyk.io/policies/tracking-and-analytics/).
*/
import * as crypto from 'crypto';
import { exec } from 'child_process';
import { Contributor } from '../types';
export const SERIOUS_DELIMITER = '_SNYK_SEPARATOR_';
export const CONTRIBUTING_DEVELOPER_PERIOD_DAYS = 90;
export async function getContributors(
{ endDate, periodDays, repoPath } = {
endDate: new Date(),
periodDays: CONTRIBUTING_DEVELOPER_PERIOD_DAYS,
repoPath: process.cwd(),
},
): Promise<Contributor[]> {
const timestampStartOfContributingDeveloperPeriod = getTimestampStartOfContributingDevTimeframe(
endDate,
periodDays,
);
const gitLogResults = await runGitLog(
timestampStartOfContributingDeveloperPeriod,
repoPath,
execShell,
);
const stats: GitRepoCommitStats = parseGitLog(gitLogResults);
return stats.getRepoContributors();
}
export class GitCommitInfo {
authorHashedEmail: string;
commitTimestamp: string; // use ISO 8601 format
constructor(authorHashedEmail: string, commitTimestamp: string) {
if (isSha1Hash(authorHashedEmail)) {
this.authorHashedEmail = authorHashedEmail;
this.commitTimestamp = commitTimestamp;
} else {
throw new Error('authorHashedEmail must be a sha1 hash');
}
}
}
export class GitRepoCommitStats {
commitInfos: GitCommitInfo[];
constructor(commitInfos: GitCommitInfo[]) {
this.commitInfos = commitInfos;
}
public static empty(): GitRepoCommitStats {
return new GitRepoCommitStats([]);
}
public addCommitInfo(info: GitCommitInfo) {
this.commitInfos.push(info);
}
public getUniqueAuthorsCount(): number {
const uniqueAuthorHashedEmails = this.getUniqueAuthorHashedEmails();
return uniqueAuthorHashedEmails.size;
}
public getCommitsCount(): number {
return this.commitInfos.length;
}
public getUniqueAuthorHashedEmails(): Set<string> {
const allCommitAuthorHashedEmails: string[] = this.commitInfos.map(
(c) => c.authorHashedEmail,
);
const uniqueAuthorHashedEmails: Set<string> = new Set(
allCommitAuthorHashedEmails,
);
return uniqueAuthorHashedEmails;
}
public getRepoContributors(): Contributor[] {
const uniqueAuthorHashedEmails = this.getUniqueAuthorHashedEmails();
const contributors: Contributor[] = [];
// for each uniqueAuthorHashedEmails, get the latest commit
for (const nextUniqueAuthorHashedEmail of uniqueAuthorHashedEmails) {
const latestCommitTimestamp = this.getMostRecentCommitTimestamp(
nextUniqueAuthorHashedEmail,
);
contributors.push({
userId: nextUniqueAuthorHashedEmail,
lastCommitDate: latestCommitTimestamp,
});
}
return contributors;
}
public getMostRecentCommitTimestamp(authorHashedEmail: string): string {
for (const nextGI of this.commitInfos) {
if (nextGI.authorHashedEmail === authorHashedEmail) {
return nextGI.commitTimestamp;
}
}
return '';
}
}
export function parseGitLogLine(logLine: string): GitCommitInfo {
const lineComponents = logLine.split(SERIOUS_DELIMITER);
const authorEmail = lineComponents[2];
const commitTimestamp = lineComponents[3];
const hashedAuthorEmail = hashData(authorEmail);
const commitInfo = new GitCommitInfo(hashedAuthorEmail, commitTimestamp);
return commitInfo;
}
export function parseGitLog(gitLog: string): GitRepoCommitStats {
if (gitLog.trim() === '') {
return GitRepoCommitStats.empty();
}
const logLines = separateLines(gitLog);
const logLineInfos: GitCommitInfo[] = logLines.map(parseGitLogLine);
const stats: GitRepoCommitStats = new GitRepoCommitStats(logLineInfos);
return stats;
}
export function hashData(s: string): string {
const hashedData = crypto
.createHash('sha1')
.update(s)
.digest('hex');
return hashedData;
}
export function isSha1Hash(data: string): boolean {
// sha1 hash must be exactly 40 characters of 0-9 / a-f (i.e. lowercase hex characters)
// ^ == start anchor
// [0-9a-f] == characters 0,1,2,3,4,5,6,7,8,9,a,b,c,d,e,f only
// {40} 40 of the [0-9a-f] characters
// $ == end anchor
const matchRegex = new RegExp('^[0-9a-f]{40}$');
const looksHashed = matchRegex.test(data);
return looksHashed;
}
/**
* @returns time stamp in seconds-since-epoch of 90 days ago since 90 days is the "contributing devs" timeframe
*/
export function getTimestampStartOfContributingDevTimeframe(
dNow: Date,
timespanInDays: number = CONTRIBUTING_DEVELOPER_PERIOD_DAYS,
): number {
const nowUtcEpocMS = dNow.getTime();
const nowUtcEpocS = Math.floor(nowUtcEpocMS / 1000);
const ONE_DAY_IN_SECONDS = 86400;
const lookbackTimespanSeconds = timespanInDays * ONE_DAY_IN_SECONDS;
const startOfPeriodEpochSeconds = nowUtcEpocS - lookbackTimespanSeconds;
return startOfPeriodEpochSeconds;
}
export async function runGitLog(
timestampEpochSecondsStartOfPeriod: number,
repoPath: string,
fnShellout: (cmd: string, workingDirectory: string) => Promise<string>,
): Promise<string> {
try {
const gitLogCommand = `git --no-pager log --no-merges --pretty=tformat:"%H${SERIOUS_DELIMITER}%an${SERIOUS_DELIMITER}%ae${SERIOUS_DELIMITER}%aI" --after="${timestampEpochSecondsStartOfPeriod}"`;
const gitLogStdout: string = await fnShellout(gitLogCommand, repoPath);
return gitLogStdout;
} catch {
return '';
}
}
export function separateLines(inputText: string): string[] {
const linuxStyleNewLine = '\n';
const windowsStyleNewLine = '\r\n';
const reg = new RegExp(`${linuxStyleNewLine}|${windowsStyleNewLine}`);
const lines = inputText.trim().split(reg);
return lines;
}
export function execShell(
cmd: string,
workingDirectory: string,
): Promise<string> {
const options = {
cwd: workingDirectory,
};
return new Promise((resolve, reject) => {
exec(cmd, options, (error, stdout, stderr) => {
if (error) {
// TODO: we can probably remove this after unshipping Node 8 support
// and then just directly get the error code like `error.code`
let exitCode = 0;
try {
exitCode = parseInt(error['code']);
} catch {
exitCode = -1;
}
const e = new ShellOutError(
error.message,
exitCode,
stdout,
stderr,
error,
);
reject(e);
} else {
resolve(stdout ? stdout : stderr);
}
});
});
}
export class ShellOutError extends Error {
public innerError: Error | undefined;
public exitCode: number | undefined;
public stdout: string | undefined;
public stderr: string | undefined;
constructor(
message: string,
exitCode: number | undefined,
stdout: string,
stderr: string,
innerError: Error | undefined,
) {
super(message);
this.exitCode = exitCode;
this.stdout = stdout;
this.stderr = stderr;
this.innerError = innerError;
}
}