import * as fs from "fs"; import * as path from "path"; import * as toolrunner from "@actions/exec/lib/toolrunner"; import * as analysisPaths from "./analysis-paths"; import { getCodeQL } from "./codeql"; import * as configUtils from "./config-utils"; import { countLoc, getIdPrefix } from "./count-loc"; import { isScannedLanguage, Language } from "./languages"; import { Logger } from "./logging"; import * as sharedEnv from "./shared-environment"; import { combineSarifFiles } from "./upload-lib"; import * as util from "./util"; export class CodeQLAnalysisError extends Error { queriesStatusReport: QueriesStatusReport; constructor(queriesStatusReport: QueriesStatusReport, message: string) { super(message); this.name = "CodeQLAnalysisError"; this.queriesStatusReport = queriesStatusReport; } } export interface QueriesStatusReport { // Time taken in ms to analyze builtin queries for cpp (or undefined if this language was not analyzed) analyze_builtin_queries_cpp_duration_ms?: number; // Time taken in ms to analyze builtin queries for csharp (or undefined if this language was not analyzed) analyze_builtin_queries_csharp_duration_ms?: number; // Time taken in ms to analyze builtin queries for go (or undefined if this language was not analyzed) analyze_builtin_queries_go_duration_ms?: number; // Time taken in ms to analyze builtin queries for java (or undefined if this language was not analyzed) analyze_builtin_queries_java_duration_ms?: number; // Time taken in ms to analyze builtin queries for javascript (or undefined if this language was not analyzed) analyze_builtin_queries_javascript_duration_ms?: number; // Time taken in ms to analyze builtin queries for python (or undefined if this language was not analyzed) analyze_builtin_queries_python_duration_ms?: number; // Time taken in ms to analyze builtin queries for ruby (or undefined if this language was not analyzed) analyze_builtin_queries_ruby_duration_ms?: number; // Time taken in ms to analyze custom queries for cpp (or undefined if this language was not analyzed) analyze_custom_queries_cpp_duration_ms?: number; // Time taken in ms to analyze custom queries for csharp (or undefined if this language was not analyzed) analyze_custom_queries_csharp_duration_ms?: number; // Time taken in ms to analyze custom queries for go (or undefined if this language was not analyzed) analyze_custom_queries_go_duration_ms?: number; // Time taken in ms to analyze custom queries for java (or undefined if this language was not analyzed) analyze_custom_queries_java_duration_ms?: number; // Time taken in ms to analyze custom queries for javascript (or undefined if this language was not analyzed) analyze_custom_queries_javascript_duration_ms?: number; // Time taken in ms to analyze custom queries for python (or undefined if this language was not analyzed) analyze_custom_queries_python_duration_ms?: number; // Time taken in ms to analyze custom queries for ruby (or undefined if this language was not analyzed) analyze_custom_queries_ruby_duration_ms?: number; // Name of language that errored during analysis (or undefined if no language failed) analyze_failure_language?: string; } async function setupPythonExtractor(logger: Logger) { const codeqlPython = process.env["CODEQL_PYTHON"]; if (codeqlPython === undefined || codeqlPython.length === 0) { // If CODEQL_PYTHON is not set, no dependencies were installed, so we don't need to do anything return; } let output = ""; const options = { listeners: { stdout: (data: Buffer) => { output += data.toString(); }, }, }; await new toolrunner.ToolRunner( codeqlPython, [ "-c", "import os; import pip; print(os.path.dirname(os.path.dirname(pip.__file__)))", ], options ).exec(); logger.info(`Setting LGTM_INDEX_IMPORT_PATH=${output}`); process.env["LGTM_INDEX_IMPORT_PATH"] = output; output = ""; await new toolrunner.ToolRunner( codeqlPython, ["-c", "import sys; print(sys.version_info[0])"], options ).exec(); logger.info(`Setting LGTM_PYTHON_SETUP_VERSION=${output}`); process.env["LGTM_PYTHON_SETUP_VERSION"] = output; } async function createdDBForScannedLanguages( config: configUtils.Config, logger: Logger ) { // Insert the LGTM_INDEX_X env vars at this point so they are set when // we extract any scanned languages. analysisPaths.includeAndExcludeAnalysisPaths(config); const codeql = getCodeQL(config.codeQLCmd); for (const language of config.languages) { if (isScannedLanguage(language)) { logger.startGroup(`Extracting ${language}`); if (language === Language.python) { await setupPythonExtractor(logger); } await codeql.extractScannedLanguage( util.getCodeQLDatabasePath(config, language), language ); logger.endGroup(); } } } async function finalizeDatabaseCreation( config: configUtils.Config, threadsFlag: string, logger: Logger ) { await createdDBForScannedLanguages(config, logger); const codeql = getCodeQL(config.codeQLCmd); for (const language of config.languages) { logger.startGroup(`Finalizing ${language}`); await codeql.finalizeDatabase( util.getCodeQLDatabasePath(config, language), threadsFlag ); logger.endGroup(); } } // Runs queries and creates sarif files in the given folder export async function runQueries( sarifFolder: string, memoryFlag: string, addSnippetsFlag: string, threadsFlag: string, automationDetailsId: string | undefined, config: configUtils.Config, logger: Logger ): Promise<QueriesStatusReport> { const statusReport: QueriesStatusReport = {}; // count the number of lines in the background const locPromise = countLoc( path.resolve(), // config.paths specifies external directories. the current // directory is included in the analysis by default. Replicate // that here. config.paths, config.pathsIgnore, config.languages, logger ); for (const language of config.languages) { logger.startGroup(`Analyzing ${language}`); const queries = config.queries[language]; const packsWithVersion = config.packs[language] || []; const hasBuiltinQueries = queries?.builtin.length > 0; const hasCustomQueries = queries?.custom.length > 0; const hasPackWithCustomQueries = packsWithVersion.length > 0; if (!hasBuiltinQueries && !hasCustomQueries && !hasPackWithCustomQueries) { throw new Error( `Unable to analyse ${language} as no queries were selected for this language` ); } try { let analysisSummaryBuiltIn = ""; const customAnalysisSummaries: string[] = []; if (queries["builtin"].length > 0) { const startTimeBuiltIn = new Date().getTime(); const { sarifFile, stdout } = await runQueryGroup( language, "builtin", createQuerySuiteContents(queries["builtin"]), sarifFolder, undefined ); analysisSummaryBuiltIn = stdout; await injectLinesOfCode(sarifFile, language, locPromise); statusReport[`analyze_builtin_queries_${language}_duration_ms`] = new Date().getTime() - startTimeBuiltIn; } const startTimeCustom = new Date().getTime(); const temporarySarifDir = config.tempDir; const temporarySarifFiles: string[] = []; for (let i = 0; i < queries["custom"].length; ++i) { if (queries["custom"][i].queries.length > 0) { const { sarifFile, stdout } = await runQueryGroup( language, `custom-${i}`, createQuerySuiteContents(queries["custom"][i].queries), temporarySarifDir, queries["custom"][i].searchPath ); customAnalysisSummaries.push(stdout); temporarySarifFiles.push(sarifFile); } } if (packsWithVersion.length > 0) { const { sarifFile, stdout } = await runQueryGroup( language, "packs", createPackSuiteContents(packsWithVersion), temporarySarifDir, undefined ); customAnalysisSummaries.push(stdout); temporarySarifFiles.push(sarifFile); } if (temporarySarifFiles.length > 0) { const sarifFile = path.join(sarifFolder, `${language}-custom.sarif`); fs.writeFileSync(sarifFile, combineSarifFiles(temporarySarifFiles)); await injectLinesOfCode(sarifFile, language, locPromise); statusReport[`analyze_custom_queries_${language}_duration_ms`] = new Date().getTime() - startTimeCustom; } logger.endGroup(); // Print the LoC baseline and the summary results from database analyze for the standard // query suite and (if appropriate) each custom query suite. logger.startGroup(`Analysis summary for ${language}`); printLinesOfCodeSummary(logger, language, await locPromise); logger.info(analysisSummaryBuiltIn); for (const [i, customSummary] of customAnalysisSummaries.entries()) { if (customSummary.trim() === "") { continue; } const description = customAnalysisSummaries.length === 1 ? "custom queries" : `custom query suite ${i + 1}/${customAnalysisSummaries.length}`; logger.info(`Analysis summary for ${description}:`); logger.info(""); logger.info(customSummary); logger.info(""); } logger.endGroup(); } catch (e) { logger.info(e); statusReport.analyze_failure_language = language; throw new CodeQLAnalysisError( statusReport, `Error running analysis for ${language}: ${e}` ); } } return statusReport; async function runQueryGroup( language: Language, type: string, querySuiteContents: string, destinationFolder: string, searchPath: string | undefined ): Promise<{ sarifFile: string; stdout: string }> { const databasePath = util.getCodeQLDatabasePath(config, language); // Pass the queries to codeql using a file instead of using the command // line to avoid command line length restrictions, particularly on windows. const querySuitePath = `${databasePath}-queries-${type}.qls`; fs.writeFileSync(querySuitePath, querySuiteContents); logger.debug( `Query suite file for ${language}-${type}...\n${querySuiteContents}` ); const sarifFile = path.join(destinationFolder, `${language}-${type}.sarif`); const codeql = getCodeQL(config.codeQLCmd); const databaseAnalyzeStdout = await codeql.databaseAnalyze( databasePath, sarifFile, searchPath, querySuitePath, memoryFlag, addSnippetsFlag, threadsFlag, automationDetailsId ); logger.debug( `SARIF results for database ${language} created at "${sarifFile}"` ); return { sarifFile, stdout: databaseAnalyzeStdout }; } } function createQuerySuiteContents(queries: string[]) { return queries.map((q: string) => `- query: ${q}`).join("\n"); } function createPackSuiteContents( packsWithVersion: configUtils.PackWithVersion[] ) { return packsWithVersion.map(packWithVersionToQuerySuiteEntry).join("\n"); } function packWithVersionToQuerySuiteEntry( pack: configUtils.PackWithVersion ): string { let text = `- qlpack: ${pack.packName}`; if (pack.version) { text += `${"\n"} version: ${pack.version}`; } return text; } export async function runAnalyze( outputDir: string, memoryFlag: string, addSnippetsFlag: string, threadsFlag: string, automationDetailsId: string | undefined, config: configUtils.Config, logger: Logger ): Promise<QueriesStatusReport> { // Delete the tracer config env var to avoid tracing ourselves delete process.env[sharedEnv.ODASA_TRACER_CONFIGURATION]; fs.mkdirSync(outputDir, { recursive: true }); logger.info("Finalizing database creation"); await finalizeDatabaseCreation(config, threadsFlag, logger); logger.info("Analyzing database"); const queriesStats = await runQueries( outputDir, memoryFlag, addSnippetsFlag, threadsFlag, automationDetailsId, config, logger ); return { ...queriesStats }; } async function injectLinesOfCode( sarifFile: string, language: Language, locPromise: Promise<Partial<Record<Language, number>>> ) { const lineCounts = await locPromise; const idPrefix = getIdPrefix(language); if (language in lineCounts) { const sarif = JSON.parse(fs.readFileSync(sarifFile, "utf8")); if (Array.isArray(sarif.runs)) { for (const run of sarif.runs) { const ruleId = `${idPrefix}/summary/lines-of-code`; run.properties = run.properties || {}; run.properties.metricResults = run.properties.metricResults || []; const rule = run.properties.metricResults.find( // the rule id can be in either of two places (r) => r.ruleId === ruleId || r.rule?.id === ruleId ); // only add the baseline value if the rule already exists if (rule) { rule.baseline = lineCounts[language]; } } } fs.writeFileSync(sarifFile, JSON.stringify(sarif)); } } function printLinesOfCodeSummary( logger: Logger, language: Language, lineCounts: Partial<Record<Language, number>> ) { if (language in lineCounts) { logger.info( `Counted ${lineCounts[language]} lines of code for ${language} as a baseline.` ); } }