renovate/lib/manager/bazel/extract.ts
Christopher Sauer c76ca3b170
feat(bazel): Allow updating more types of http_archives, including zip (#7929)
Co-authored-by: Michael Kriese <michael.kriese@visualon.de>
2020-12-10 09:13:47 +01:00

277 lines
8 KiB
TypeScript

/* eslint no-plusplus: 0 */
import { parse as _parse } from 'url';
import parse from 'github-url-from-git';
import * as datasourceDocker from '../../datasource/docker';
import * as datasourceGithubReleases from '../../datasource/github-releases';
import * as datasourceGithubTags from '../../datasource/github-tags';
import * as datasourceGo from '../../datasource/go';
import { logger } from '../../logger';
import { SkipReason } from '../../types';
import { regEx } from '../../util/regex';
import * as dockerVersioning from '../../versioning/docker';
import { PackageDependency, PackageFile } from '../common';
interface UrlParsedResult {
datasource: string;
repo: string;
currentValue: string;
}
function parseUrl(urlString: string): UrlParsedResult | null {
// istanbul ignore if
if (!urlString) {
return null;
}
const url = _parse(urlString);
if (url.host !== 'github.com') {
return null;
}
const path = url.path.split('/').slice(1);
const repo = path[0] + '/' + path[1];
let datasource: string;
let currentValue: string = null;
if (path[2] === 'releases' && path[3] === 'download') {
datasource = datasourceGithubReleases.id;
currentValue = path[4];
}
if (path[2] === 'archive') {
datasource = datasourceGithubTags.id;
currentValue = path[3];
// Strip archive extension to get hash or tag.
// Tolerates formats produced by Git(Hub|Lab) and allowed by http_archive
// Note: Order matters in suffix list to strip, e.g. .tar.gz.
for (const extension of ['.gz', '.bz2', '.xz', '.tar', '.tgz', '.zip']) {
if (currentValue.endsWith(extension)) {
currentValue = currentValue.slice(0, -extension.length);
}
}
}
if (currentValue) {
return { datasource, repo, currentValue };
}
// istanbul ignore next
return null;
}
function findBalancedParenIndex(longString: string): number {
/**
* Minimalistic string parser with single task -> find last char in def.
* It treats [)] as the last char.
* To find needed closing parenthesis we need to increment
* nesting depth when parser feeds opening parenthesis
* if one opening parenthesis -> 1
* if two opening parenthesis -> 2
* if two opening and one closing parenthesis -> 1
* if ["""] found then ignore all [)] until closing ["""] parsed.
* https://github.com/renovatebot/renovate/pull/3459#issuecomment-478249702
*/
let intShouldNotBeOdd = 0; // openClosePythonMultiLineComment
let parenNestingDepth = 1;
return [...longString].findIndex((char, i, arr) => {
switch (char) {
case '(':
parenNestingDepth++;
break;
case ')':
parenNestingDepth--;
break;
case '"':
if (i > 1 && arr.slice(i - 2, i).every((prev) => char === prev)) {
intShouldNotBeOdd++;
}
break;
default:
break;
}
return !parenNestingDepth && !(intShouldNotBeOdd % 2) && char === ')';
});
}
function parseContent(content: string): string[] {
return [
'container_pull',
'http_archive',
'http_file',
'go_repository',
'git_repository',
].reduce(
(acc, prefix) => [
...acc,
...content
.split(regEx(prefix + '\\s*\\(', 'g'))
.slice(1)
.map((base) => {
const ind = findBalancedParenIndex(base);
return ind >= 0 && `${prefix}(${base.slice(0, ind)})`;
})
.filter(Boolean),
],
[] as string[]
);
}
export function extractPackageFile(
content: string,
fileName?: string
): PackageFile | null {
const definitions = parseContent(content);
if (!definitions.length) {
logger.debug({ fileName }, 'No matching bazel WORKSPACE definitions found');
return null;
}
logger.debug({ definitions }, `Found ${definitions.length} definitions`);
const deps: PackageDependency[] = [];
definitions.forEach((def) => {
logger.debug({ def }, 'Checking bazel definition');
const [depType] = def.split('(', 1);
const dep: PackageDependency = { depType, managerData: { def } };
let depName: string;
let importpath: string;
let remote: string;
let currentValue: string;
let commit: string;
let url: string;
let sha256: string;
let digest: string;
let repository: string;
let registry: string;
let match = /name\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, depName] = match;
}
match = /digest\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, digest] = match;
}
match = /registry\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, registry] = match;
}
match = /repository\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, repository] = match;
}
match = /remote\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, remote] = match;
}
match = /tag\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, currentValue] = match;
}
match = /url\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, url] = match;
}
match = /urls\s*=\s*\[\s*"([^\]]+)",?\s*\]/.exec(def);
if (match) {
const urls = match[1].replace(/\s/g, '').split('","');
url = urls.find(parseUrl);
}
match = /commit\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, commit] = match;
}
match = /sha256\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, sha256] = match;
}
match = /importpath\s*=\s*"([^"]+)"/.exec(def);
if (match) {
[, importpath] = match;
}
logger.debug({ dependency: depName, remote, currentValue });
if (
depType === 'git_repository' &&
depName &&
remote &&
(currentValue || commit)
) {
dep.depName = depName;
if (currentValue) {
dep.currentValue = currentValue;
}
if (commit) {
dep.currentDigest = commit;
}
// TODO: Check if we really need to use parse here or if it should always be a plain https url
const githubURL = parse(remote);
if (githubURL) {
const repo = githubURL.substring('https://github.com/'.length);
dep.datasource = datasourceGithubReleases.id;
dep.lookupName = repo;
deps.push(dep);
}
} else if (
depType === 'go_repository' &&
depName &&
importpath &&
(currentValue || commit)
) {
dep.depName = depName;
dep.currentValue = currentValue || commit.substr(0, 7);
dep.datasource = datasourceGo.id;
dep.lookupName = importpath;
if (remote) {
const remoteMatch = /https:\/\/github\.com(?:.*\/)(([a-zA-Z]+)([-])?([a-zA-Z]+))/.exec(
remote
);
if (remoteMatch && remoteMatch[0].length === remote.length) {
dep.lookupName = remote.replace('https://', '');
} else {
dep.skipReason = SkipReason.UnsupportedRemote;
}
}
if (commit) {
dep.currentValue = 'v0.0.0';
dep.currentDigest = commit;
dep.currentDigestShort = commit.substr(0, 7);
dep.digestOneAndOnly = true;
}
deps.push(dep);
} else if (
(depType === 'http_archive' || depType === 'http_file') &&
depName &&
parseUrl(url) &&
sha256
) {
const parsedUrl = parseUrl(url);
dep.depName = depName;
dep.repo = parsedUrl.repo;
if (/^[a-f0-9]{40}$/i.test(parsedUrl.currentValue)) {
dep.currentDigest = parsedUrl.currentValue;
} else {
dep.currentValue = parsedUrl.currentValue;
}
dep.datasource = parsedUrl.datasource;
dep.lookupName = dep.repo;
deps.push(dep);
} else if (
depType === 'container_pull' &&
currentValue &&
digest &&
repository &&
registry
) {
dep.currentDigest = digest;
dep.currentValue = currentValue;
dep.depName = depName;
dep.versioning = dockerVersioning.id;
dep.datasource = datasourceDocker.id;
dep.lookupName = repository;
dep.registryUrls = [registry];
deps.push(dep);
} else {
logger.debug(
{ def },
'Failed to find dependency in bazel WORKSPACE definition'
);
}
});
if (!deps.length) {
return null;
}
return { deps };
}