mirror of
https://github.com/github/codeql-action.git
synced 2025-12-28 10:10:17 +08:00
345 lines
12 KiB
TypeScript
345 lines
12 KiB
TypeScript
import * as fs from "fs";
|
|
import * as path from "path";
|
|
|
|
import * as toolrunner from "@actions/exec/lib/toolrunner";
|
|
|
|
import * as analysisPaths from "./analysis-paths";
|
|
import { getCodeQL } from "./codeql";
|
|
import * as configUtils from "./config-utils";
|
|
import { countLoc, getIdPrefix } from "./count-loc";
|
|
import { isScannedLanguage, Language } from "./languages";
|
|
import { Logger } from "./logging";
|
|
import * as sharedEnv from "./shared-environment";
|
|
import { combineSarifFiles } from "./upload-lib";
|
|
import * as util from "./util";
|
|
|
|
export class CodeQLAnalysisError extends Error {
|
|
queriesStatusReport: QueriesStatusReport;
|
|
|
|
constructor(queriesStatusReport: QueriesStatusReport, message: string) {
|
|
super(message);
|
|
|
|
this.name = "CodeQLAnalysisError";
|
|
this.queriesStatusReport = queriesStatusReport;
|
|
}
|
|
}
|
|
|
|
export interface QueriesStatusReport {
|
|
// Time taken in ms to analyze builtin queries for cpp (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_cpp_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for csharp (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_csharp_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for go (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_go_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for java (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_java_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for javascript (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_javascript_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for python (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_python_duration_ms?: number;
|
|
// Time taken in ms to analyze builtin queries for ruby (or undefined if this language was not analyzed)
|
|
analyze_builtin_queries_ruby_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for cpp (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_cpp_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for csharp (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_csharp_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for go (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_go_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for java (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_java_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for javascript (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_javascript_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for python (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_python_duration_ms?: number;
|
|
// Time taken in ms to analyze custom queries for ruby (or undefined if this language was not analyzed)
|
|
analyze_custom_queries_ruby_duration_ms?: number;
|
|
// Name of language that errored during analysis (or undefined if no language failed)
|
|
analyze_failure_language?: string;
|
|
}
|
|
|
|
async function setupPythonExtractor(logger: Logger) {
|
|
const codeqlPython = process.env["CODEQL_PYTHON"];
|
|
if (codeqlPython === undefined || codeqlPython.length === 0) {
|
|
// If CODEQL_PYTHON is not set, no dependencies were installed, so we don't need to do anything
|
|
return;
|
|
}
|
|
|
|
let output = "";
|
|
const options = {
|
|
listeners: {
|
|
stdout: (data: Buffer) => {
|
|
output += data.toString();
|
|
},
|
|
},
|
|
};
|
|
|
|
await new toolrunner.ToolRunner(
|
|
codeqlPython,
|
|
[
|
|
"-c",
|
|
"import os; import pip; print(os.path.dirname(os.path.dirname(pip.__file__)))",
|
|
],
|
|
options
|
|
).exec();
|
|
logger.info(`Setting LGTM_INDEX_IMPORT_PATH=${output}`);
|
|
process.env["LGTM_INDEX_IMPORT_PATH"] = output;
|
|
|
|
output = "";
|
|
await new toolrunner.ToolRunner(
|
|
codeqlPython,
|
|
["-c", "import sys; print(sys.version_info[0])"],
|
|
options
|
|
).exec();
|
|
logger.info(`Setting LGTM_PYTHON_SETUP_VERSION=${output}`);
|
|
process.env["LGTM_PYTHON_SETUP_VERSION"] = output;
|
|
}
|
|
|
|
async function createdDBForScannedLanguages(
|
|
config: configUtils.Config,
|
|
logger: Logger
|
|
) {
|
|
// Insert the LGTM_INDEX_X env vars at this point so they are set when
|
|
// we extract any scanned languages.
|
|
analysisPaths.includeAndExcludeAnalysisPaths(config);
|
|
|
|
const codeql = getCodeQL(config.codeQLCmd);
|
|
for (const language of config.languages) {
|
|
if (isScannedLanguage(language)) {
|
|
logger.startGroup(`Extracting ${language}`);
|
|
|
|
if (language === Language.python) {
|
|
await setupPythonExtractor(logger);
|
|
}
|
|
|
|
await codeql.extractScannedLanguage(
|
|
util.getCodeQLDatabasePath(config, language),
|
|
language
|
|
);
|
|
logger.endGroup();
|
|
}
|
|
}
|
|
}
|
|
|
|
async function finalizeDatabaseCreation(
|
|
config: configUtils.Config,
|
|
threadsFlag: string,
|
|
logger: Logger
|
|
) {
|
|
await createdDBForScannedLanguages(config, logger);
|
|
|
|
const codeql = getCodeQL(config.codeQLCmd);
|
|
for (const language of config.languages) {
|
|
logger.startGroup(`Finalizing ${language}`);
|
|
await codeql.finalizeDatabase(
|
|
util.getCodeQLDatabasePath(config, language),
|
|
threadsFlag
|
|
);
|
|
logger.endGroup();
|
|
}
|
|
}
|
|
|
|
// Runs queries and creates sarif files in the given folder
|
|
export async function runQueries(
|
|
sarifFolder: string,
|
|
memoryFlag: string,
|
|
addSnippetsFlag: string,
|
|
threadsFlag: string,
|
|
automationDetailsId: string | undefined,
|
|
config: configUtils.Config,
|
|
logger: Logger
|
|
): Promise<QueriesStatusReport> {
|
|
const statusReport: QueriesStatusReport = {};
|
|
|
|
// count the number of lines in the background
|
|
const locPromise = countLoc(
|
|
path.resolve(),
|
|
// config.paths specifies external directories. the current
|
|
// directory is included in the analysis by default. Replicate
|
|
// that here.
|
|
config.paths,
|
|
config.pathsIgnore,
|
|
config.languages,
|
|
logger
|
|
);
|
|
|
|
for (const language of config.languages) {
|
|
logger.startGroup(`Analyzing ${language}`);
|
|
|
|
const queries = config.queries[language];
|
|
if (
|
|
queries === undefined ||
|
|
(queries.builtin.length === 0 && queries.custom.length === 0)
|
|
) {
|
|
throw new Error(
|
|
`Unable to analyse ${language} as no queries were selected for this language`
|
|
);
|
|
}
|
|
|
|
try {
|
|
let analysisSummary = "";
|
|
if (queries["builtin"].length > 0) {
|
|
const startTimeBuliltIn = new Date().getTime();
|
|
const { sarifFile, stdout } = await runQueryGroup(
|
|
language,
|
|
"builtin",
|
|
queries["builtin"],
|
|
sarifFolder,
|
|
undefined
|
|
);
|
|
analysisSummary = stdout;
|
|
await injectLinesOfCode(sarifFile, language, locPromise);
|
|
|
|
statusReport[`analyze_builtin_queries_${language}_duration_ms`] =
|
|
new Date().getTime() - startTimeBuliltIn;
|
|
}
|
|
const startTimeCustom = new Date().getTime();
|
|
const temporarySarifDir = config.tempDir;
|
|
const temporarySarifFiles: string[] = [];
|
|
for (let i = 0; i < queries["custom"].length; ++i) {
|
|
if (queries["custom"][i].queries.length > 0) {
|
|
const { sarifFile } = await runQueryGroup(
|
|
language,
|
|
`custom-${i}`,
|
|
queries["custom"][i].queries,
|
|
temporarySarifDir,
|
|
queries["custom"][i].searchPath
|
|
);
|
|
temporarySarifFiles.push(sarifFile);
|
|
}
|
|
}
|
|
if (temporarySarifFiles.length > 0) {
|
|
const sarifFile = path.join(sarifFolder, `${language}-custom.sarif`);
|
|
fs.writeFileSync(sarifFile, combineSarifFiles(temporarySarifFiles));
|
|
await injectLinesOfCode(sarifFile, language, locPromise);
|
|
|
|
statusReport[`analyze_custom_queries_${language}_duration_ms`] =
|
|
new Date().getTime() - startTimeCustom;
|
|
}
|
|
logger.endGroup();
|
|
|
|
// Print the LoC baseline and the summary results from database analyze.
|
|
logger.startGroup(`Analysis summary for ${language}`);
|
|
printLinesOfCodeSummary(logger, language, await locPromise);
|
|
logger.info(analysisSummary);
|
|
logger.endGroup();
|
|
} catch (e) {
|
|
logger.info(e);
|
|
statusReport.analyze_failure_language = language;
|
|
throw new CodeQLAnalysisError(
|
|
statusReport,
|
|
`Error running analysis for ${language}: ${e}`
|
|
);
|
|
}
|
|
}
|
|
|
|
return statusReport;
|
|
|
|
async function runQueryGroup(
|
|
language: Language,
|
|
type: string,
|
|
queries: string[],
|
|
destinationFolder: string,
|
|
searchPath: string | undefined
|
|
): Promise<{ sarifFile: string; stdout: string }> {
|
|
const databasePath = util.getCodeQLDatabasePath(config, language);
|
|
// Pass the queries to codeql using a file instead of using the command
|
|
// line to avoid command line length restrictions, particularly on windows.
|
|
const querySuitePath = `${databasePath}-queries-${type}.qls`;
|
|
const querySuiteContents = queries
|
|
.map((q: string) => `- query: ${q}`)
|
|
.join("\n");
|
|
fs.writeFileSync(querySuitePath, querySuiteContents);
|
|
logger.debug(`Query suite file for ${language}...\n${querySuiteContents}`);
|
|
|
|
const sarifFile = path.join(destinationFolder, `${language}-${type}.sarif`);
|
|
|
|
const codeql = getCodeQL(config.codeQLCmd);
|
|
const databaseAnalyzeStdout = await codeql.databaseAnalyze(
|
|
databasePath,
|
|
sarifFile,
|
|
searchPath,
|
|
querySuitePath,
|
|
memoryFlag,
|
|
addSnippetsFlag,
|
|
threadsFlag,
|
|
automationDetailsId
|
|
);
|
|
|
|
logger.debug(
|
|
`SARIF results for database ${language} created at "${sarifFile}"`
|
|
);
|
|
return { sarifFile, stdout: databaseAnalyzeStdout };
|
|
}
|
|
}
|
|
|
|
export async function runAnalyze(
|
|
outputDir: string,
|
|
memoryFlag: string,
|
|
addSnippetsFlag: string,
|
|
threadsFlag: string,
|
|
automationDetailsId: string | undefined,
|
|
config: configUtils.Config,
|
|
logger: Logger
|
|
): Promise<QueriesStatusReport> {
|
|
// Delete the tracer config env var to avoid tracing ourselves
|
|
delete process.env[sharedEnv.ODASA_TRACER_CONFIGURATION];
|
|
|
|
fs.mkdirSync(outputDir, { recursive: true });
|
|
|
|
logger.info("Finalizing database creation");
|
|
await finalizeDatabaseCreation(config, threadsFlag, logger);
|
|
|
|
logger.info("Analyzing database");
|
|
const queriesStats = await runQueries(
|
|
outputDir,
|
|
memoryFlag,
|
|
addSnippetsFlag,
|
|
threadsFlag,
|
|
automationDetailsId,
|
|
config,
|
|
logger
|
|
);
|
|
|
|
return { ...queriesStats };
|
|
}
|
|
|
|
async function injectLinesOfCode(
|
|
sarifFile: string,
|
|
language: Language,
|
|
locPromise: Promise<Partial<Record<Language, number>>>
|
|
) {
|
|
const lineCounts = await locPromise;
|
|
const idPrefix = getIdPrefix(language);
|
|
if (language in lineCounts) {
|
|
const sarif = JSON.parse(fs.readFileSync(sarifFile, "utf8"));
|
|
if (Array.isArray(sarif.runs)) {
|
|
for (const run of sarif.runs) {
|
|
const ruleId = `${idPrefix}/summary/lines-of-code`;
|
|
run.properties = run.properties || {};
|
|
run.properties.metricResults = run.properties.metricResults || [];
|
|
const rule = run.properties.metricResults.find(
|
|
// the rule id can be in either of two places
|
|
(r) => r.ruleId === ruleId || r.rule?.id === ruleId
|
|
);
|
|
// only add the baseline value if the rule already exists
|
|
if (rule) {
|
|
rule.baseline = lineCounts[language];
|
|
}
|
|
}
|
|
}
|
|
fs.writeFileSync(sarifFile, JSON.stringify(sarif));
|
|
}
|
|
}
|
|
|
|
function printLinesOfCodeSummary(
|
|
logger: Logger,
|
|
language: Language,
|
|
lineCounts: Partial<Record<Language, number>>
|
|
) {
|
|
if (language in lineCounts) {
|
|
logger.info(
|
|
`Counted ${lineCounts[language]} lines of code for ${language} as a baseline.`
|
|
);
|
|
}
|
|
}
|