mirror of
https://github.com/github/codeql.git
synced 2025-12-17 01:03:14 +01:00
181 lines
6.3 KiB
C#
181 lines
6.3 KiB
C#
using System;
|
|
using System.Collections.Generic;
|
|
using System.IO;
|
|
using System.Linq;
|
|
|
|
namespace Semmle.Extraction.CSharp.DependencyFetching
|
|
{
|
|
/// <summary>
|
|
/// Manages the set of assemblies.
|
|
/// Searches for assembly DLLs, indexes them and provides
|
|
/// a lookup facility from assembly ID to filename.
|
|
/// </summary>
|
|
internal class AssemblyCache
|
|
{
|
|
/// <summary>
|
|
/// Locate all reference files and index them.
|
|
/// </summary>
|
|
/// <param name="paths">
|
|
/// Paths to search. Directories are searched recursively. Files are added directly to the
|
|
/// assembly cache.
|
|
/// </param>
|
|
/// <param name="progressMonitor">Callback for progress.</param>
|
|
public AssemblyCache(IEnumerable<string> paths, ProgressMonitor progressMonitor)
|
|
{
|
|
foreach (var path in paths)
|
|
{
|
|
if (File.Exists(path))
|
|
{
|
|
pendingDllsToIndex.Enqueue(path);
|
|
}
|
|
else
|
|
{
|
|
progressMonitor.FindingFiles(path);
|
|
AddReferenceDirectory(path);
|
|
}
|
|
}
|
|
IndexReferences();
|
|
}
|
|
|
|
/// <summary>
|
|
/// Finds all assemblies nested within a directory
|
|
/// and adds them to its index.
|
|
/// (Indexing is performed at a later stage by IndexReferences()).
|
|
/// </summary>
|
|
/// <param name="dir">The directory to index.</param>
|
|
private void AddReferenceDirectory(string dir)
|
|
{
|
|
foreach (var dll in new DirectoryInfo(dir).EnumerateFiles("*.dll", SearchOption.AllDirectories))
|
|
{
|
|
pendingDllsToIndex.Enqueue(dll.FullName);
|
|
}
|
|
}
|
|
|
|
private static readonly Version emptyVersion = new Version(0, 0, 0, 0);
|
|
|
|
/// <summary>
|
|
/// Indexes all DLLs we have located.
|
|
/// Because this is a potentially time-consuming operation, it is put into a separate stage.
|
|
/// </summary>
|
|
private void IndexReferences()
|
|
{
|
|
// Read all of the files
|
|
foreach (var filename in pendingDllsToIndex)
|
|
{
|
|
IndexReference(filename);
|
|
}
|
|
|
|
// Index "assemblyInfo" by version string
|
|
// The OrderBy is used to ensure that we by default select the highest version number.
|
|
foreach (var info in assemblyInfoByFileName.Values
|
|
.OrderBy(info => info.Name)
|
|
.ThenBy(info => info.NetCoreVersion ?? emptyVersion)
|
|
.ThenBy(info => info.Version ?? emptyVersion))
|
|
{
|
|
foreach (var index in info.IndexStrings)
|
|
{
|
|
assemblyInfoById[index] = info;
|
|
}
|
|
}
|
|
}
|
|
|
|
private void IndexReference(string filename)
|
|
{
|
|
try
|
|
{
|
|
var info = AssemblyInfo.ReadFromFile(filename);
|
|
assemblyInfoByFileName[filename] = info;
|
|
}
|
|
catch (AssemblyLoadException)
|
|
{
|
|
failedAssemblyInfoFileNames.Add(filename);
|
|
}
|
|
}
|
|
|
|
/// <summary>
|
|
/// The number of DLLs which are assemblies.
|
|
/// </summary>
|
|
public int AssemblyCount => assemblyInfoByFileName.Count;
|
|
|
|
/// <summary>
|
|
/// The number of DLLs which weren't assemblies. (E.g. C++).
|
|
/// </summary>
|
|
public int NonAssemblyCount => failedAssemblyInfoFileNames.Count;
|
|
|
|
/// <summary>
|
|
/// Given an assembly id, determine its full info.
|
|
/// </summary>
|
|
/// <param name="id">The given assembly id.</param>
|
|
/// <returns>The information about the assembly.</returns>
|
|
public AssemblyInfo ResolveReference(string id)
|
|
{
|
|
// Fast path if we've already seen this before.
|
|
if (failedAssemblyInfoIds.Contains(id))
|
|
throw new AssemblyLoadException();
|
|
|
|
string assemblyName;
|
|
(id, assemblyName) = AssemblyInfo.ComputeSanitizedAssemblyInfo(id);
|
|
|
|
// Look up the id in our references map.
|
|
if (assemblyInfoById.TryGetValue(id, out var result))
|
|
{
|
|
// The string is in the references map.
|
|
return result;
|
|
}
|
|
|
|
// Fallback position - locate the assembly by its lower-case name only.
|
|
var asmName = assemblyName.ToLowerInvariant();
|
|
|
|
if (assemblyInfoById.TryGetValue(asmName, out result))
|
|
{
|
|
assemblyInfoById[asmName] = result; // Speed up the next time the same string is resolved
|
|
return result;
|
|
}
|
|
|
|
failedAssemblyInfoIds.Add(id); // Fail early next time
|
|
|
|
throw new AssemblyLoadException();
|
|
}
|
|
|
|
/// <summary>
|
|
/// All the assemblies we have indexed.
|
|
/// </summary>
|
|
public IEnumerable<AssemblyInfo> AllAssemblies => assemblyInfoByFileName.Select(a => a.Value);
|
|
|
|
/// <summary>
|
|
/// Retrieve the assembly info of a pre-cached assembly.
|
|
/// </summary>
|
|
/// <param name="filepath">The filename to query.</param>
|
|
/// <returns>The assembly info.</returns>
|
|
public AssemblyInfo GetAssemblyInfo(string filepath)
|
|
{
|
|
if (assemblyInfoByFileName.TryGetValue(filepath, out var info))
|
|
{
|
|
return info;
|
|
}
|
|
|
|
IndexReference(filepath);
|
|
|
|
if (assemblyInfoByFileName.TryGetValue(filepath, out info))
|
|
{
|
|
return info;
|
|
}
|
|
|
|
throw new AssemblyLoadException();
|
|
}
|
|
|
|
private readonly Queue<string> pendingDllsToIndex = new Queue<string>();
|
|
|
|
private readonly Dictionary<string, AssemblyInfo> assemblyInfoByFileName = new Dictionary<string, AssemblyInfo>();
|
|
|
|
// List of DLLs which are not assemblies.
|
|
// We probably don't need to keep this
|
|
private readonly List<string> failedAssemblyInfoFileNames = new List<string>();
|
|
|
|
// Map from assembly id (in various formats) to the full info.
|
|
private readonly Dictionary<string, AssemblyInfo> assemblyInfoById = new Dictionary<string, AssemblyInfo>();
|
|
|
|
private readonly HashSet<string> failedAssemblyInfoIds = new HashSet<string>();
|
|
}
|
|
}
|