mirror of
https://github.com/github/codeql-action.git
synced 2025-12-27 09:40:17 +08:00
435 lines
15 KiB
TypeScript
435 lines
15 KiB
TypeScript
import * as fs from "fs";
|
|
import * as path from "path";
|
|
import { performance } from "perf_hooks";
|
|
|
|
import * as toolrunner from "@actions/exec/lib/toolrunner";
|
|
import del from "del";
|
|
import * as yaml from "js-yaml";
|
|
|
|
import {
|
|
CODEQL_VERSION_ANALYSIS_SUMMARY_V2,
|
|
CodeQL,
|
|
getCodeQL,
|
|
} from "./codeql";
|
|
import * as configUtils from "./config-utils";
|
|
import {
|
|
FeatureEnablement,
|
|
Feature,
|
|
isPythonDependencyInstallationDisabled,
|
|
} from "./feature-flags";
|
|
import { isScannedLanguage, Language } from "./languages";
|
|
import { Logger } from "./logging";
|
|
import { DatabaseCreationTimings, EventReport } from "./status-report";
|
|
import { endTracingForCluster } from "./tracer-config";
|
|
import { validateSarifFileSchema } from "./upload-lib";
|
|
import * as util from "./util";
|
|
|
|
export class CodeQLAnalysisError extends Error {
|
|
queriesStatusReport: QueriesStatusReport;
|
|
|
|
constructor(queriesStatusReport: QueriesStatusReport, message: string) {
|
|
super(message);
|
|
|
|
this.name = "CodeQLAnalysisError";
|
|
this.queriesStatusReport = queriesStatusReport;
|
|
}
|
|
}
|
|
|
|
export interface QueriesStatusReport {
|
|
/**
|
|
* Time taken in ms to run queries for cpp (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_cpp_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for csharp (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_csharp_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for go (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_go_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for java (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_java_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for javascript (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_javascript_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for python (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_python_duration_ms?: number;
|
|
/**
|
|
* Time taken in ms to run queries for ruby (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_ruby_duration_ms?: number;
|
|
/** Time taken in ms to run queries for swift (or undefined if this language was not analyzed).
|
|
*
|
|
* The "builtin" designation is now outdated with the move to CLI config parsing: this is the time
|
|
* taken to run _all_ the queries.
|
|
*/
|
|
analyze_builtin_queries_swift_duration_ms?: number;
|
|
|
|
/** Time taken in ms to interpret results for cpp (or undefined if this language was not analyzed). */
|
|
interpret_results_cpp_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for csharp (or undefined if this language was not analyzed). */
|
|
interpret_results_csharp_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for go (or undefined if this language was not analyzed). */
|
|
interpret_results_go_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for java (or undefined if this language was not analyzed). */
|
|
interpret_results_java_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for javascript (or undefined if this language was not analyzed). */
|
|
interpret_results_javascript_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for python (or undefined if this language was not analyzed). */
|
|
interpret_results_python_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for ruby (or undefined if this language was not analyzed). */
|
|
interpret_results_ruby_duration_ms?: number;
|
|
/** Time taken in ms to interpret results for swift (or undefined if this language was not analyzed). */
|
|
interpret_results_swift_duration_ms?: number;
|
|
|
|
/** Name of language that errored during analysis (or undefined if no language failed). */
|
|
analyze_failure_language?: string;
|
|
/** Reports on discrete events associated with this status report. */
|
|
event_reports?: EventReport[];
|
|
}
|
|
|
|
async function setupPythonExtractor(
|
|
logger: Logger,
|
|
features: FeatureEnablement,
|
|
codeql: CodeQL,
|
|
) {
|
|
const codeqlPython = process.env["CODEQL_PYTHON"];
|
|
if (codeqlPython === undefined || codeqlPython.length === 0) {
|
|
// If CODEQL_PYTHON is not set, no dependencies were installed, so we don't need to do anything
|
|
return;
|
|
}
|
|
|
|
if (await isPythonDependencyInstallationDisabled(codeql, features)) {
|
|
logger.warning(
|
|
"We recommend that you remove the CODEQL_PYTHON environment variable from your workflow. This environment variable was originally used to specify a Python executable that included the dependencies of your Python code, however Python analysis no longer uses these dependencies." +
|
|
"\nIf you used CODEQL_PYTHON to force the version of Python to analyze as, please use CODEQL_EXTRACTOR_PYTHON_ANALYSIS_VERSION instead, such as 'CODEQL_EXTRACTOR_PYTHON_ANALYSIS_VERSION=2.7' or 'CODEQL_EXTRACTOR_PYTHON_ANALYSIS_VERSION=3.11'.",
|
|
);
|
|
return;
|
|
}
|
|
|
|
const scriptsFolder = path.resolve(__dirname, "../python-setup");
|
|
|
|
let output = "";
|
|
const options = {
|
|
listeners: {
|
|
stdout: (data: Buffer) => {
|
|
output += data.toString();
|
|
},
|
|
},
|
|
};
|
|
|
|
await new toolrunner.ToolRunner(
|
|
codeqlPython,
|
|
[path.join(scriptsFolder, "find_site_packages.py")],
|
|
options,
|
|
).exec();
|
|
logger.info(`Setting LGTM_INDEX_IMPORT_PATH=${output}`);
|
|
process.env["LGTM_INDEX_IMPORT_PATH"] = output;
|
|
|
|
output = "";
|
|
await new toolrunner.ToolRunner(
|
|
codeqlPython,
|
|
["-c", "import sys; print(sys.version_info[0])"],
|
|
options,
|
|
).exec();
|
|
logger.info(`Setting LGTM_PYTHON_SETUP_VERSION=${output}`);
|
|
process.env["LGTM_PYTHON_SETUP_VERSION"] = output;
|
|
}
|
|
|
|
export async function createdDBForScannedLanguages(
|
|
codeql: CodeQL,
|
|
config: configUtils.Config,
|
|
logger: Logger,
|
|
features: FeatureEnablement,
|
|
) {
|
|
for (const language of config.languages) {
|
|
if (
|
|
isScannedLanguage(language) &&
|
|
!dbIsFinalized(config, language, logger)
|
|
) {
|
|
logger.startGroup(`Extracting ${language}`);
|
|
|
|
if (language === Language.python) {
|
|
await setupPythonExtractor(logger, features, codeql);
|
|
}
|
|
|
|
await codeql.extractScannedLanguage(config, language);
|
|
logger.endGroup();
|
|
}
|
|
}
|
|
}
|
|
|
|
export function dbIsFinalized(
|
|
config: configUtils.Config,
|
|
language: Language,
|
|
logger: Logger,
|
|
) {
|
|
const dbPath = util.getCodeQLDatabasePath(config, language);
|
|
try {
|
|
const dbInfo = yaml.load(
|
|
fs.readFileSync(path.resolve(dbPath, "codeql-database.yml"), "utf8"),
|
|
) as { inProgress?: boolean };
|
|
return !("inProgress" in dbInfo);
|
|
} catch (e) {
|
|
logger.warning(
|
|
`Could not check whether database for ${language} was finalized. Assuming it is not.`,
|
|
);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
async function finalizeDatabaseCreation(
|
|
config: configUtils.Config,
|
|
threadsFlag: string,
|
|
memoryFlag: string,
|
|
logger: Logger,
|
|
features: FeatureEnablement,
|
|
): Promise<DatabaseCreationTimings> {
|
|
const codeql = await getCodeQL(config.codeQLCmd);
|
|
|
|
const extractionStart = performance.now();
|
|
await createdDBForScannedLanguages(codeql, config, logger, features);
|
|
const extractionTime = performance.now() - extractionStart;
|
|
|
|
const trapImportStart = performance.now();
|
|
for (const language of config.languages) {
|
|
if (dbIsFinalized(config, language, logger)) {
|
|
logger.info(
|
|
`There is already a finalized database for ${language} at the location where the CodeQL Action places databases, so we did not create one.`,
|
|
);
|
|
} else {
|
|
logger.startGroup(`Finalizing ${language}`);
|
|
await codeql.finalizeDatabase(
|
|
util.getCodeQLDatabasePath(config, language),
|
|
threadsFlag,
|
|
memoryFlag,
|
|
);
|
|
logger.endGroup();
|
|
}
|
|
}
|
|
const trapImportTime = performance.now() - trapImportStart;
|
|
|
|
return {
|
|
scanned_language_extraction_duration_ms: Math.round(extractionTime),
|
|
trap_import_duration_ms: Math.round(trapImportTime),
|
|
};
|
|
}
|
|
|
|
// Runs queries and creates sarif files in the given folder
|
|
export async function runQueries(
|
|
sarifFolder: string,
|
|
memoryFlag: string,
|
|
addSnippetsFlag: string,
|
|
threadsFlag: string,
|
|
automationDetailsId: string | undefined,
|
|
config: configUtils.Config,
|
|
logger: Logger,
|
|
features: FeatureEnablement,
|
|
): Promise<QueriesStatusReport> {
|
|
const statusReport: QueriesStatusReport = {};
|
|
|
|
const codeql = await getCodeQL(config.codeQLCmd);
|
|
const queryFlags = [memoryFlag, threadsFlag];
|
|
|
|
for (const language of config.languages) {
|
|
try {
|
|
const sarifFile = path.join(sarifFolder, `${language}.sarif`);
|
|
|
|
// The work needed to generate the query suites
|
|
// is done in the CLI. We just need to make a single
|
|
// call to run all the queries for each language and
|
|
// another to interpret the results.
|
|
logger.startGroup(`Running queries for ${language}`);
|
|
const startTimeRunQueries = new Date().getTime();
|
|
const databasePath = util.getCodeQLDatabasePath(config, language);
|
|
await codeql.databaseRunQueries(databasePath, queryFlags, features);
|
|
logger.debug(`Finished running queries for ${language}.`);
|
|
// TODO should not be using `builtin` here. We should be using `all` instead.
|
|
// The status report does not support `all` yet.
|
|
statusReport[`analyze_builtin_queries_${language}_duration_ms`] =
|
|
new Date().getTime() - startTimeRunQueries;
|
|
|
|
logger.startGroup(`Interpreting results for ${language}`);
|
|
const startTimeInterpretResults = new Date();
|
|
const analysisSummary = await runInterpretResults(
|
|
language,
|
|
undefined,
|
|
sarifFile,
|
|
config.debugMode,
|
|
);
|
|
const endTimeInterpretResults = new Date();
|
|
statusReport[`interpret_results_${language}_duration_ms`] =
|
|
endTimeInterpretResults.getTime() - startTimeInterpretResults.getTime();
|
|
logger.endGroup();
|
|
logger.info(analysisSummary);
|
|
|
|
if (await features.getValue(Feature.QaTelemetryEnabled)) {
|
|
const perQueryAlertCounts = getPerQueryAlertCounts(sarifFile, logger);
|
|
|
|
const perQueryAlertCountEventReport: EventReport = {
|
|
event: "codeql database interpret-results",
|
|
started_at: startTimeInterpretResults.toISOString(),
|
|
completed_at: endTimeInterpretResults.toISOString(),
|
|
exit_status: "success",
|
|
language,
|
|
properties: {
|
|
alertCounts: perQueryAlertCounts,
|
|
},
|
|
};
|
|
|
|
if (statusReport["event_reports"] === undefined) {
|
|
statusReport["event_reports"] = [];
|
|
}
|
|
statusReport["event_reports"].push(perQueryAlertCountEventReport);
|
|
}
|
|
|
|
if (
|
|
!(await util.codeQlVersionAbove(
|
|
codeql,
|
|
CODEQL_VERSION_ANALYSIS_SUMMARY_V2,
|
|
))
|
|
) {
|
|
await runPrintLinesOfCode(language);
|
|
}
|
|
} catch (e) {
|
|
statusReport.analyze_failure_language = language;
|
|
throw new CodeQLAnalysisError(
|
|
statusReport,
|
|
`Error running analysis for ${language}: ${util.wrapError(e).message}`,
|
|
);
|
|
}
|
|
}
|
|
|
|
return statusReport;
|
|
|
|
async function runInterpretResults(
|
|
language: Language,
|
|
queries: string[] | undefined,
|
|
sarifFile: string,
|
|
enableDebugLogging: boolean,
|
|
): Promise<string> {
|
|
const databasePath = util.getCodeQLDatabasePath(config, language);
|
|
return await codeql.databaseInterpretResults(
|
|
databasePath,
|
|
queries,
|
|
sarifFile,
|
|
addSnippetsFlag,
|
|
threadsFlag,
|
|
enableDebugLogging ? "-vv" : "-v",
|
|
automationDetailsId,
|
|
config,
|
|
features,
|
|
logger,
|
|
);
|
|
}
|
|
|
|
/** Get an object with all queries and their counts parsed from a SARIF file path. */
|
|
function getPerQueryAlertCounts(
|
|
sarifPath: string,
|
|
log: Logger,
|
|
): Record<string, number> {
|
|
validateSarifFileSchema(sarifPath, log);
|
|
const sarifObject = JSON.parse(
|
|
fs.readFileSync(sarifPath, "utf8"),
|
|
) as util.SarifFile;
|
|
// We do not need to compute fingerprints because we are not sending data based off of locations.
|
|
|
|
// Generate the query: alert count object
|
|
const perQueryAlertCounts: Record<string, number> = {};
|
|
|
|
// All rules (queries), from all results, from all runs
|
|
for (const sarifRun of sarifObject.runs) {
|
|
if (sarifRun.results) {
|
|
for (const result of sarifRun.results) {
|
|
const query = result.rule?.id || result.ruleId;
|
|
if (query) {
|
|
perQueryAlertCounts[query] = (perQueryAlertCounts[query] || 0) + 1;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
return perQueryAlertCounts;
|
|
}
|
|
|
|
async function runPrintLinesOfCode(language: Language): Promise<string> {
|
|
const databasePath = util.getCodeQLDatabasePath(config, language);
|
|
return await codeql.databasePrintBaseline(databasePath);
|
|
}
|
|
}
|
|
|
|
export async function runFinalize(
|
|
outputDir: string,
|
|
threadsFlag: string,
|
|
memoryFlag: string,
|
|
config: configUtils.Config,
|
|
logger: Logger,
|
|
features: FeatureEnablement,
|
|
): Promise<DatabaseCreationTimings> {
|
|
try {
|
|
await del(outputDir, { force: true });
|
|
} catch (error: any) {
|
|
if (error?.code !== "ENOENT") {
|
|
throw error;
|
|
}
|
|
}
|
|
await fs.promises.mkdir(outputDir, { recursive: true });
|
|
|
|
const timings = await finalizeDatabaseCreation(
|
|
config,
|
|
threadsFlag,
|
|
memoryFlag,
|
|
logger,
|
|
features,
|
|
);
|
|
|
|
// WARNING: This does not _really_ end tracing, as the tracer will restore its
|
|
// critical environment variables and it'll still be active for all processes
|
|
// launched from this build step.
|
|
// However, it will stop tracing for all steps past the codeql-action/analyze
|
|
// step.
|
|
// Delete variables as specified by the end-tracing script
|
|
await endTracingForCluster(config);
|
|
return timings;
|
|
}
|
|
|
|
export async function runCleanup(
|
|
config: configUtils.Config,
|
|
cleanupLevel: string,
|
|
logger: Logger,
|
|
): Promise<void> {
|
|
logger.startGroup("Cleaning up databases");
|
|
for (const language of config.languages) {
|
|
const codeql = await getCodeQL(config.codeQLCmd);
|
|
const databasePath = util.getCodeQLDatabasePath(config, language);
|
|
await codeql.databaseCleanup(databasePath, cleanupLevel);
|
|
}
|
|
logger.endGroup();
|
|
}
|