mirror of
https://github.com/github/codeql.git
synced 2025-12-17 09:13:20 +01:00
355 lines
16 KiB
C#
355 lines
16 KiB
C#
using System.Collections.Generic;
|
|
using System.Linq;
|
|
using Microsoft.CodeAnalysis;
|
|
using Semmle.Util;
|
|
using Semmle.Extraction.CSharp.Entities;
|
|
|
|
namespace Semmle.Extraction.CSharp
|
|
{
|
|
/// <summary>
|
|
/// Implements the comment processor for associating comments with program elements.
|
|
/// Registers locations of comments and program elements,
|
|
/// then generates binding information.
|
|
/// </summary>
|
|
internal class CommentProcessor
|
|
{
|
|
public void AddComment(CommentLine comment)
|
|
{
|
|
comments[comment.Location] = comment;
|
|
}
|
|
|
|
// Comments sorted by location.
|
|
private readonly SortedDictionary<Microsoft.CodeAnalysis.Location, CommentLine> comments = new SortedDictionary<Microsoft.CodeAnalysis.Location, CommentLine>(new LocationComparer());
|
|
|
|
// Program elements sorted by location.
|
|
private readonly SortedDictionary<Microsoft.CodeAnalysis.Location, Label> elements = new SortedDictionary<Microsoft.CodeAnalysis.Location, Label>(new LocationComparer());
|
|
|
|
private readonly Dictionary<Label, Key> duplicationGuardKeys = new Dictionary<Label, Key>();
|
|
|
|
private Key? GetDuplicationGuardKey(Label label)
|
|
{
|
|
if (duplicationGuardKeys.TryGetValue(label, out var duplicationGuardKey))
|
|
return duplicationGuardKey;
|
|
return null;
|
|
}
|
|
|
|
private class LocationComparer : IComparer<Microsoft.CodeAnalysis.Location>
|
|
{
|
|
public int Compare(Microsoft.CodeAnalysis.Location? l1, Microsoft.CodeAnalysis.Location? l2) => CommentProcessor.Compare(l1, l2);
|
|
}
|
|
|
|
/// <summary>
|
|
/// Comparer for two locations, allowing them to be inserted into a sorted list.
|
|
/// </summary>
|
|
/// <param name="l1">First location</param>
|
|
/// <param name="l2">Second location</param>
|
|
/// <returns><0 if l1 before l2, >0 if l1 after l2, else 0.</returns>
|
|
private static int Compare(Microsoft.CodeAnalysis.Location? l1, Microsoft.CodeAnalysis.Location? l2)
|
|
{
|
|
if (object.ReferenceEquals(l1, l2))
|
|
return 0;
|
|
if (l1 is null)
|
|
return -1;
|
|
if (l2 is null)
|
|
return 1;
|
|
|
|
var diff = l1.SourceTree == l2.SourceTree ? 0 : l1.SourceTree!.FilePath.CompareTo(l2.SourceTree!.FilePath);
|
|
if (diff != 0)
|
|
return diff;
|
|
diff = l1.SourceSpan.Start - l2.SourceSpan.Start;
|
|
if (diff != 0)
|
|
return diff;
|
|
return l1.SourceSpan.End - l2.SourceSpan.End;
|
|
}
|
|
|
|
/// <summary>
|
|
/// Called by the populator when there is a program element which can have comments.
|
|
/// </summary>
|
|
/// <param name="elementLabel">The label of the element in the trap file.</param>
|
|
/// <param name="duplicationGuardKey">The duplication guard key of the element, if any.</param>
|
|
/// <param name="loc">The location of the element.</param>
|
|
public void AddElement(Label elementLabel, Key? duplicationGuardKey, Microsoft.CodeAnalysis.Location? loc)
|
|
{
|
|
if (loc is not null && loc.IsInSource)
|
|
elements[loc] = elementLabel;
|
|
if (duplicationGuardKey is not null)
|
|
duplicationGuardKeys[elementLabel] = duplicationGuardKey;
|
|
}
|
|
|
|
// Ensure that commentBlock and element refer to the same file
|
|
// which can happen when processing multiple files.
|
|
private static void EnsureSameFile(Comments.CommentBlock commentBlock, ref KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? element)
|
|
{
|
|
if (element is not null && element.Value.Key.SourceTree != commentBlock.Location.SourceTree)
|
|
element = null;
|
|
}
|
|
|
|
/// <summary>
|
|
/// Generate the bindings between a comment and program elements.
|
|
/// Called once for each commentBlock.
|
|
/// </summary>
|
|
///
|
|
/// <param name="commentBlock">The comment block.</param>
|
|
/// <param name="previousElement">The element before the comment block.</param>
|
|
/// <param name="nextElement">The element after the comment block.</param>
|
|
/// <param name="parentElement">The parent element of the comment block.</param>
|
|
/// <param name="callback">Output binding information.</param>
|
|
private void GenerateBindings(
|
|
Comments.CommentBlock commentBlock,
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? previousElement,
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? nextElement,
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? parentElement,
|
|
CommentBindingCallback callback
|
|
)
|
|
{
|
|
EnsureSameFile(commentBlock, ref previousElement);
|
|
EnsureSameFile(commentBlock, ref nextElement);
|
|
EnsureSameFile(commentBlock, ref parentElement);
|
|
|
|
if (previousElement is not null)
|
|
{
|
|
var key = previousElement.Value.Value;
|
|
callback(key, GetDuplicationGuardKey(key), commentBlock, CommentBinding.Before);
|
|
}
|
|
|
|
if (nextElement is not null)
|
|
{
|
|
var key = nextElement.Value.Value;
|
|
callback(key, GetDuplicationGuardKey(key), commentBlock, CommentBinding.After);
|
|
}
|
|
|
|
if (parentElement is not null)
|
|
{
|
|
var key = parentElement.Value.Value;
|
|
callback(key, GetDuplicationGuardKey(key), commentBlock, CommentBinding.Parent);
|
|
}
|
|
|
|
// Heuristic to decide which is the "best" element associated with the comment.
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? bestElement;
|
|
|
|
if (previousElement is not null && previousElement.Value.Key.EndLine() == commentBlock.Location.StartLine())
|
|
{
|
|
// 1. If the comment is on the same line as the previous element, use that
|
|
bestElement = previousElement;
|
|
}
|
|
else if (nextElement is not null && nextElement.Value.Key.StartLine() == commentBlock.Location.EndLine())
|
|
{
|
|
// 2. If the comment is on the same line as the next element, use that
|
|
bestElement = nextElement;
|
|
}
|
|
else if (nextElement is not null && previousElement is not null &&
|
|
previousElement.Value.Key.EndLine() + 1 == commentBlock.Location.StartLine() &&
|
|
commentBlock.Location.EndLine() + 1 == nextElement.Value.Key.StartLine())
|
|
{
|
|
// 3. If comment is equally between two elements, use the parentElement
|
|
// because it's ambiguous whether the comment refers to the next or previous element
|
|
bestElement = parentElement;
|
|
}
|
|
else if (nextElement is not null && nextElement.Value.Key.StartLine() == commentBlock.Location.EndLine() + 1)
|
|
{
|
|
// 4. If there is no gap after the comment, use "nextElement"
|
|
bestElement = nextElement;
|
|
}
|
|
else if (previousElement is not null && previousElement.Value.Key.EndLine() + 1 == commentBlock.Location.StartLine())
|
|
{
|
|
// 5. If there is no gap before the comment, use previousElement
|
|
bestElement = previousElement;
|
|
}
|
|
else
|
|
{
|
|
// 6. Otherwise, bind the comment to the parent block.
|
|
bestElement = parentElement;
|
|
|
|
/* if parentElement==null, then there is no best element. The comment is effectively orphaned.
|
|
*
|
|
* This can be caused by comments that are not in a type declaration.
|
|
* Due to restrictions in the dbscheme, the comment cannot be associated with the "file"
|
|
* which is not an element, and the "using" declarations are not emitted by the extractor.
|
|
*/
|
|
}
|
|
|
|
if (bestElement is not null)
|
|
{
|
|
var label = bestElement.Value.Value;
|
|
callback(label, GetDuplicationGuardKey(label), commentBlock, CommentBinding.Best);
|
|
}
|
|
}
|
|
|
|
// Stores element nesting information in a stack.
|
|
// Top of stack = most nested element, based on Location.
|
|
private class ElementStack
|
|
{
|
|
// Invariant: the top of the stack must be contained by items below it.
|
|
private readonly Stack<KeyValuePair<Microsoft.CodeAnalysis.Location, Label>> elementStack = new();
|
|
|
|
/// <summary>
|
|
/// Add a new element to the stack.
|
|
/// </summary>
|
|
/// The stack is maintained.
|
|
/// <param name="value">The new element to push.</param>
|
|
public void Push(KeyValuePair<Microsoft.CodeAnalysis.Location, Label> value)
|
|
{
|
|
// Maintain the invariant by popping existing elements
|
|
while (elementStack.Count > 0 && !elementStack.Peek().Key.Contains(value.Key))
|
|
elementStack.Pop();
|
|
|
|
elementStack.Push(value);
|
|
}
|
|
|
|
/// <summary>
|
|
/// Locate the parent of a comment with location l.
|
|
/// </summary>
|
|
/// <param name="l">The location of the comment.</param>
|
|
/// <returns>An element completely containing l, or null if none found.</returns>
|
|
public KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? FindParent(Microsoft.CodeAnalysis.Location l) =>
|
|
elementStack.Where(v => v.Key.Contains(l)).FirstOrNull();
|
|
|
|
/// <summary>
|
|
/// Finds the element on the stack immediately preceding the comment at l.
|
|
/// </summary>
|
|
/// <param name="l">The location of the comment.</param>
|
|
/// <returns>The element before l, or null.</returns>
|
|
public KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? FindBefore(Microsoft.CodeAnalysis.Location l)
|
|
{
|
|
return elementStack
|
|
.Where(v => v.Key.SourceSpan.End < l.SourceSpan.Start)
|
|
.LastOrNull();
|
|
}
|
|
|
|
/// <summary>
|
|
/// Finds the element after the comment.
|
|
/// </summary>
|
|
/// <param name="comment">The location of the comment.</param>
|
|
/// <param name="next">The next element.</param>
|
|
/// <returns>The next element.</returns>
|
|
public KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? FindAfter(Microsoft.CodeAnalysis.Location comment, KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? next)
|
|
{
|
|
var p = FindParent(comment);
|
|
return next.HasValue && p.HasValue && p.Value.Key.Before(next.Value.Key) ? null : next;
|
|
}
|
|
}
|
|
|
|
// Generate binding information for one CommentBlock.
|
|
private void GenerateBindings(
|
|
Comments.CommentBlock block,
|
|
ElementStack elementStack,
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? nextElement,
|
|
CommentBindingCallback cb
|
|
)
|
|
{
|
|
if (block.CommentLines.Any())
|
|
{
|
|
GenerateBindings(
|
|
block,
|
|
elementStack.FindBefore(block.Location),
|
|
elementStack.FindAfter(block.Location, nextElement),
|
|
elementStack.FindParent(block.Location),
|
|
cb);
|
|
}
|
|
}
|
|
|
|
/// <summary>
|
|
/// Process comments up until nextElement.
|
|
/// Group comments into blocks, and associate blocks with elements.
|
|
/// </summary>
|
|
///
|
|
/// <param name="commentEnumerator">Enumerator for all comments in the program.</param>
|
|
/// <param name="nextElement">The next element in the list.</param>
|
|
/// <param name="elementStack">A stack of nested program elements.</param>
|
|
/// <param name="cb">Where to send the results.</param>
|
|
/// <returns>true if there are more comments to process, false otherwise.</returns>
|
|
private bool GenerateBindings(
|
|
IEnumerator<KeyValuePair<Microsoft.CodeAnalysis.Location, CommentLine>> commentEnumerator,
|
|
KeyValuePair<Microsoft.CodeAnalysis.Location, Label>? nextElement,
|
|
ElementStack elementStack,
|
|
CommentBindingCallback cb
|
|
)
|
|
{
|
|
Comments.CommentBlock? block = null;
|
|
|
|
// Iterate comments until the commentEnumerator has gone past nextElement
|
|
while (nextElement is null || Compare(commentEnumerator.Current.Value.Location, nextElement.Value.Key) < 0)
|
|
{
|
|
if (block is null)
|
|
block = new Comments.CommentBlock(commentEnumerator.Current.Value);
|
|
|
|
if (!block.CombinesWith(commentEnumerator.Current.Value))
|
|
{
|
|
// Start of a new block, so generate the bindings for the old block first.
|
|
GenerateBindings(block, elementStack, nextElement, cb);
|
|
block = new Comments.CommentBlock(commentEnumerator.Current.Value);
|
|
}
|
|
else
|
|
{
|
|
block.AddCommentLine(commentEnumerator.Current.Value);
|
|
}
|
|
|
|
// Get the next comment.
|
|
if (!commentEnumerator.MoveNext())
|
|
{
|
|
// If there are no more comments, generate the remaining bindings and return false.
|
|
GenerateBindings(block, elementStack, nextElement, cb);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
if (!(block is null))
|
|
GenerateBindings(block, elementStack, nextElement, cb);
|
|
|
|
return true;
|
|
}
|
|
|
|
/// <summary>
|
|
/// Merge comments into blocks and associate comment blocks with program elements.
|
|
/// </summary>
|
|
/// <param name="cb">Callback for the binding information</param>
|
|
public void GenerateBindings(CommentBindingCallback cb)
|
|
{
|
|
/* Algorithm:
|
|
* Do a merge of elements and comments, which are both sorted in location order.
|
|
*
|
|
* Iterate through all elements, and iterate all comment lines between adjacent pairs of elements.
|
|
* Maintain a stack of elements, such that the top of the stack must be fully nested in the
|
|
* element below it. This enables comments to be associated with the "parent" element, as well as
|
|
* elements before, after and "best" element match for a comment.
|
|
*
|
|
* This is an O(n) algorithm because the list of elements and comments are traversed once.
|
|
* (Note that comment processing is O(n.log n) overall due to dictionary of elements and comments.)
|
|
*/
|
|
|
|
var elementStack = new ElementStack();
|
|
|
|
using IEnumerator<KeyValuePair<Microsoft.CodeAnalysis.Location, Label>> elementEnumerator = elements.GetEnumerator();
|
|
using IEnumerator<KeyValuePair<Microsoft.CodeAnalysis.Location, CommentLine>> commentEnumerator = comments.GetEnumerator();
|
|
if (!commentEnumerator.MoveNext())
|
|
{
|
|
// There are no comments to process.
|
|
return;
|
|
}
|
|
|
|
while (elementEnumerator.MoveNext())
|
|
{
|
|
if (!GenerateBindings(commentEnumerator, elementEnumerator.Current, elementStack, cb))
|
|
{
|
|
// No more comments to process.
|
|
return;
|
|
}
|
|
|
|
elementStack.Push(elementEnumerator.Current);
|
|
}
|
|
|
|
// Generate remaining comments at end of file
|
|
GenerateBindings(commentEnumerator, null, elementStack, cb);
|
|
}
|
|
}
|
|
|
|
/// <summary>
|
|
/// Callback for generated comment associations.
|
|
/// </summary>
|
|
/// <param name="elementLabel">The label of the element</param>
|
|
/// <param name="duplicationGuardKey">The duplication guard key of the element, if any</param>
|
|
/// <param name="commentBlock">The comment block associated with the element</param>
|
|
/// <param name="binding">The relationship between the commentblock and the element</param>
|
|
internal delegate void CommentBindingCallback(Label elementLabel, Key? duplicationGuardKey, Comments.CommentBlock commentBlock, CommentBinding binding);
|
|
}
|