File: ConvertToInterpolatedString\AbstractConvertConcatenationToInterpolatedStringRefactoringProvider.cs
Web Access
Project: src\src\Features\Core\Portable\Microsoft.CodeAnalysis.Features.csproj (Microsoft.CodeAnalysis.Features)
// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.
 
using System.Collections.Immutable;
using System.Linq;
using System.Threading;
using System.Threading.Tasks;
using Microsoft.CodeAnalysis.CodeActions;
using Microsoft.CodeAnalysis.CodeRefactorings;
using Microsoft.CodeAnalysis.Editing;
using Microsoft.CodeAnalysis.LanguageService;
using Microsoft.CodeAnalysis.PooledObjects;
using Microsoft.CodeAnalysis.Shared.Extensions;
using Microsoft.CodeAnalysis.Simplification;
 
namespace Microsoft.CodeAnalysis.ConvertToInterpolatedString;
 
/// <summary>
/// Code refactoring that converts expressions of the form:  a + b + " str " + d + e
/// into:
///     $"{a + b} str {d}{e}".
/// </summary>
internal abstract class AbstractConvertConcatenationToInterpolatedStringRefactoringProvider<TExpressionSyntax> : CodeRefactoringProvider
    where TExpressionSyntax : SyntaxNode
{
    /// <summary>
    /// Language-specific hook consulted once per conversion with the document's compilation.
    /// When it returns <see langword="true"/>, the conversion drops a <c>.ToString()</c> call from a
    /// concatenated piece if that call binds to <c>object.ToString</c> or an override of it, and uses the
    /// receiver as the interpolation instead.
    /// </summary>
    /// <remarks>
    /// NOTE(review): presumably answers whether the compilation can use interpolated string handlers; the
    /// exact criterion lives in the derived providers and is not visible here.
    /// </remarks>
    /// <param name="compilation">The compilation of the document being refactored.</param>
    protected abstract bool SupportsInterpolatedStringHandler(Compilation compilation);
 
    /// <summary>
    /// Language-specific hook that turns the source text of a string or character literal token into the text
    /// placed inside the generated interpolated string.
    /// </summary>
    /// <remarks>
    /// NOTE(review): judging by the name, implementations strip the literal's opening and closing delimiters;
    /// confirm against the derived providers.
    /// </remarks>
    /// <param name="text">
    /// The literal token's source text, delimiters included, with every <c>{</c> and <c>}</c> already doubled
    /// by the caller.
    /// </param>
    /// <param name="isVerbatimStringLiteral">Whether the interpolated string being built is verbatim.</param>
    /// <param name="isCharacterLiteral">Whether <paramref name="text"/> comes from a character literal.</param>
    /// <returns>The text used as the source text of an interpolated-string text token.</returns>
    protected abstract string GetTextWithoutQuotes(string text, bool isVerbatimStringLiteral, bool isCharacterLiteral);
 
    /// <summary>
    /// Offers "Convert to interpolated string" when the selection covers an entire, outermost string
    /// concatenation that contains at least one non-literal operand.
    /// </summary>
    /// <param name="context">The refactoring context supplying the document, the selected span and cancellation.</param>
    public sealed override async Task ComputeRefactoringsAsync(CodeRefactoringContext context)
    {
        var (document, textSpan, cancellationToken) = context;
        var candidates = await context.GetRelevantNodesAsync<TExpressionSyntax>().ConfigureAwait(false);

        var generator = SyntaxGenerator.GetGenerator(document);
        var syntaxFacts = document.GetRequiredLanguageService<ISyntaxFactsService>();
        var semanticModel = await document.GetRequiredSemanticModelAsync(cancellationToken).ConfigureAwait(false);

        // Of all relevant nodes, keep the last one that is a string concatenation: that is the largest
        // concatenation available for the current selection.
        TExpressionSyntax? top = null;
        foreach (var candidate in candidates)
        {
            if (IsStringConcat(syntaxFacts, candidate, semanticModel, cancellationToken))
                top = candidate;
        }

        if (top == null)
            return;

        var constantInterpolationSupported = syntaxFacts.SupportsConstantInterpolatedStrings(document.Project.ParseOptions!);
        if (!constantInterpolationSupported)
        {
            // Without constant interpolated strings, converting the initializer of a const declaration would
            // break it, so don't offer the refactoring there.
            var declarator = top.FirstAncestorOrSelf<SyntaxNode>(syntaxFacts.IsVariableDeclarator);
            if (declarator != null && generator.GetModifiers(declarator).IsConst)
                return;
        }

        // Only complete sub-trees can be converted, so arbitrary selections are not supported. Selections that
        // happen to line up with a complete sub-tree (e.g. a prefix of the right length) could be supported in
        // theory, but that would feel arbitrary to the user. Hence the selection must cover the whole topmost
        // concatenation. This gives up some leniency around under-selection, but it is the best option so far.
        if (CodeRefactoringHelpers.IsNodeUnderselected(top, textSpan))
            return;

        if (IsStringConcat(syntaxFacts, top.Parent, semanticModel, cancellationToken))
            return;

        // Flatten the concatenation into its operands, in source order.
        using var _ = ArrayBuilder<SyntaxNode>.GetInstance(out var pieces);
        CollectPiecesDown(syntaxFacts, pieces, top, semanticModel, cancellationToken);

        var literalPieces = pieces
            .Where(piece => syntaxFacts.IsStringLiteralExpression(piece) || syntaxFacts.IsCharacterLiteralExpression(piece))
            .ToImmutableArray();

        // Nothing but literals: the user most likely split the string by hand for readability, so there is
        // nothing worth interpolating.
        if (literalPieces.Length == pieces.Count)
            return;

        // All literal tokens must be of the same kind (all verbatim or all regular). Something like
        // @" "" " + " \r\n " is left alone so that different escaping rules never have to be reconciled.
        var isVerbatimStringLiteral =
            literalPieces.Length > 0 &&
            syntaxFacts.IsVerbatimStringLiteral(literalPieces[0].GetFirstToken());

        var hasMixedLiteralKinds = literalPieces
            .Skip(1)
            .Any(literal => syntaxFacts.IsVerbatimStringLiteral(literal.GetFirstToken()) != isVerbatimStringLiteral);
        if (hasMixedLiteralKinds)
            return;

        var piecesArray = pieces.ToImmutable();
        var codeAction = CodeAction.Create(
            FeaturesResources.Convert_to_interpolated_string,
            token => UpdateDocumentAsync(document, top, isVerbatimStringLiteral, piecesArray, token),
            nameof(FeaturesResources.Convert_to_interpolated_string));

        context.RegisterRefactoring(codeAction, top.Span);
    }
 
    /// <summary>
    /// Returns a copy of <paramref name="document"/> in which <paramref name="top"/> has been replaced by the
    /// interpolated string built from <paramref name="pieces"/>.
    /// </summary>
    private async Task<Document> UpdateDocumentAsync(
        Document document, SyntaxNode top, bool isVerbatimStringLiteral, ImmutableArray<SyntaxNode> pieces, CancellationToken cancellationToken)
    {
        var oldRoot = await document.GetRequiredSyntaxRootAsync(cancellationToken).ConfigureAwait(false);

        var replacement = await CreateInterpolatedStringAsync(
            document, isVerbatimStringLiteral, pieces, cancellationToken).ConfigureAwait(false);

        var newRoot = oldRoot.ReplaceNode(top, replacement);
        return document.WithSyntaxRoot(newRoot);
    }
 
    /// <summary>
    /// Builds the interpolated string expression that is equivalent to concatenating
    /// <paramref name="pieces"/> in order.
    /// </summary>
    /// <remarks>
    /// <list type="bullet">
    /// <item>String and character literal pieces become interpolated-string text, with braces doubled.</item>
    /// <item>Consecutive text is merged so the result never contains two adjacent text nodes.</item>
    /// <item>Interpolated-string pieces whose verbatim-ness matches <paramref name="isVerbatimStringLiteral"/>
    /// have their contents inlined instead of being nested.</item>
    /// <item>Every other piece becomes an interpolation; a <c>.ToString()</c> call may be removed from it
    /// first (see the local function <c>TryRemoveToString</c>).</item>
    /// </list>
    /// The leading trivia of the first piece and the trailing trivia of the last piece are moved onto the start
    /// and end tokens of the new expression.
    /// </remarks>
    /// <param name="document">Document the pieces belong to; supplies language services and the semantic model.</param>
    /// <param name="isVerbatimStringLiteral">Whether to create a verbatim interpolated string.</param>
    /// <param name="pieces">The concatenation operands, in source order. Must not be empty.</param>
    /// <param name="cancellationToken">Token used to cancel semantic queries.</param>
    /// <returns>The new interpolated string expression node.</returns>
    protected async Task<SyntaxNode> CreateInterpolatedStringAsync(
        Document document, bool isVerbatimStringLiteral, ImmutableArray<SyntaxNode> pieces, CancellationToken cancellationToken)
    {
        var semanticModel = await document.GetRequiredSemanticModelAsync(cancellationToken).ConfigureAwait(false);
        var supportsInterpolatedStringHandler = this.SupportsInterpolatedStringHandler(semanticModel.Compilation);

        var syntaxFacts = document.GetRequiredLanguageService<ISyntaxFactsService>();
        var generator = SyntaxGenerator.GetGenerator(document);
        var startToken = generator
            .CreateInterpolatedStringStartToken(isVerbatimStringLiteral)
            .WithLeadingTrivia(pieces.First().GetLeadingTrivia());
        var endToken = generator
            .CreateInterpolatedStringEndToken()
            .WithTrailingTrivia(pieces.Last().GetTrailingTrivia());

        using var _ = ArrayBuilder<SyntaxNode>.GetInstance(pieces.Length, out var content);
        var previousContentWasStringLiteralExpression = false;
        foreach (var piece in pieces)
        {
            var isCharacterLiteral = syntaxFacts.IsCharacterLiteralExpression(piece);
            var currentContentIsStringOrCharacterLiteral = syntaxFacts.IsStringLiteralExpression(piece) || isCharacterLiteral;
            if (currentContentIsStringOrCharacterLiteral)
            {
                var literalToken = piece.GetFirstToken();
                var text = literalToken.Text;
                var value = literalToken.Value?.ToString() ?? literalToken.ValueText;

                // Braces are significant inside an interpolated string, so literal braces must be doubled in
                // both the source text and the value text.
                var textWithEscapedBraces = text.Replace("{", "{{").Replace("}", "}}");
                var valueTextWithEscapedBraces = value.Replace("{", "{{").Replace("}", "}}");
                var textWithoutQuotes = GetTextWithoutQuotes(textWithEscapedBraces, isVerbatimStringLiteral, isCharacterLiteral);
                if (previousContentWasStringLiteralExpression)
                {
                    // Last part we added to the content list was also an interpolated-string-text-node.
                    // We need to combine these as the API for creating an interpolated string
                    // does not expect to be given a list containing adjacent string nodes.
                    // Essentially if we combine '"A" + 1 + "B" + "C"' into '$"A{1}BC"' it must be:
                    //      {InterpolatedStringText}{Interpolation}{InterpolatedStringText}
                    // not:
                    //      {InterpolatedStringText}{Interpolation}{InterpolatedStringText}{InterpolatedStringText}
                    var existingInterpolatedStringTextNode = content.Last();
                    var newText = ConcatenateTextToTextNode(generator, existingInterpolatedStringTextNode, textWithoutQuotes, valueTextWithEscapedBraces);
                    content[^1] = newText;
                }
                else
                {
                    // This is either the first string literal we have encountered or it is the most recent one we've seen
                    // after adding an interpolation.  Add a new interpolated-string-text-node to the list.
                    content.Add(generator.InterpolatedStringText(generator.InterpolatedStringTextToken(textWithoutQuotes, valueTextWithEscapedBraces)));
                }
            }
            else if (syntaxFacts.IsInterpolatedStringExpression(piece) &&
                syntaxFacts.IsVerbatimInterpolatedStringExpression(piece) == isVerbatimStringLiteral)
            {
                // "piece" is itself an interpolated string (of the same "verbatimity" as the new interpolated string)
                // "a" + $"{1+ 1}" -> instead of $"a{$"{1 + 1}"}" inline the interpolated part: $"a{1 + 1}"
                syntaxFacts.GetPartsOfInterpolationExpression(piece, out var _, out var contentParts, out var _);

                // An interpolated string without any content (e.g. $"") contributes nothing to the result, so it
                // must not interrupt text merging: for "a" + $"" + "b" the texts "a" and "b" still have to end up
                // in a single text node. Start from the previous state; every content part overwrites it below.
                currentContentIsStringOrCharacterLiteral = previousContentWasStringLiteralExpression;

                foreach (var contentPart in contentParts)
                {
                    // Track the state of currentContentIsStringOrCharacterLiteral for the inlined parts
                    // so any text at the end of piece can be merged with the next string literal:
                    // $"{1 + 1}a" + "b" -> "a" and "b" get merged in the next "pieces" loop
                    currentContentIsStringOrCharacterLiteral = syntaxFacts.IsInterpolatedStringText(contentPart);
                    if (currentContentIsStringOrCharacterLiteral && previousContentWasStringLiteralExpression)
                    {
                        // if piece starts with a text and the previous part was a string, merge the two parts (see also above)
                        // "a" + $"b{1 + 1}" -> "a" and "b" get merged
                        var newText = ConcatenateTextToTextNode(generator, content.Last(), contentPart.GetFirstToken().Text, contentPart.GetFirstToken().ValueText);
                        content[^1] = newText;
                    }
                    else
                    {
                        content.Add(contentPart);
                    }

                    // Only the first contentPart can be merged, therefore we set previousContentWasStringLiteralExpression to false
                    previousContentWasStringLiteralExpression = false;
                }
            }
            else
            {
                // Drop a trailing `.ToString()` from the expression when that is safe to do.
                var converted = TryRemoveToString(piece);

                // Add Simplifier annotation to remove superfluous parenthesis after transformation:
                // (1 + 1) + "a" -> $"{1 + 1}a"
                converted = syntaxFacts.IsParenthesizedExpression(converted)
                    ? converted.WithAdditionalAnnotations(Simplifier.Annotation)
                    : converted;
                content.Add(generator.Interpolation(converted.WithoutTrivia()));
            }
            // Update this variable to be true every time we encounter a new string literal expression
            // so we know to concatenate future string literals together if we encounter them.
            previousContentWasStringLiteralExpression = currentContentIsStringOrCharacterLiteral;
        }

        return generator.InterpolatedStringExpression(startToken, content, endToken);

        // Returns the receiver of `receiver.ToString()` when the call can be dropped, otherwise the piece itself.
        SyntaxNode TryRemoveToString(SyntaxNode piece)
        {
            if (supportsInterpolatedStringHandler)
            {
                // if it's a call to object's .ToString (or any override), then we can remove this if the runtime
                // supports interpolated string handlers. This gives the most flexibility to the handler to decide what
                // it wants to do.
                if (syntaxFacts.IsInvocationExpression(piece))
                {
                    syntaxFacts.GetPartsOfInvocationExpression(piece, out var memberAccess, out var _);
                    if (syntaxFacts.IsMemberAccessExpression(memberAccess))
                    {
                        syntaxFacts.GetPartsOfMemberAccessExpression(memberAccess, out var expression, out var name);

                        // `base.ToString()` must be kept as is: `base` is only legal as the receiver of a member
                        // access, so an interpolation of the bare `base` keyword would not compile.
                        if (syntaxFacts.GetIdentifierOfSimpleName(name).ValueText == nameof(ToString) &&
                            !syntaxFacts.IsBaseExpression(expression))
                        {
                            // Walk up the override chain to find where this ToString was originally declared.
                            var symbol = semanticModel.GetSymbolInfo(memberAccess, cancellationToken).Symbol as IMethodSymbol;
                            while (symbol?.OverriddenMethod != null)
                                symbol = symbol.OverriddenMethod;

                            if (symbol?.ContainingType.SpecialType == SpecialType.System_Object)
                                return expression;
                        }
                    }
                }
            }

            return piece;
        }
    }
 
    /// <summary>
    /// Creates a new interpolated-string text node whose source text and value text are those of the first
    /// token of <paramref name="interpolatedStringTextNode"/> with <paramref name="textWithoutQuotes"/> and
    /// <paramref name="value"/> appended, respectively.
    /// </summary>
    private static SyntaxNode ConcatenateTextToTextNode(SyntaxGenerator generator, SyntaxNode interpolatedStringTextNode, string textWithoutQuotes, string value)
    {
        var existingToken = interpolatedStringTextNode.GetFirstToken();

        var mergedToken = generator.InterpolatedStringTextToken(
            existingToken.Text + textWithoutQuotes,
            existingToken.ValueText + value);

        return generator.InterpolatedStringText(mergedToken);
    }
 
    /// <summary>
    /// Flattens the left-leaning chain of string concatenations rooted at <paramref name="node"/> and appends
    /// its operands to <paramref name="pieces"/> in source (left-to-right) order.
    /// </summary>
    /// <remarks>
    /// Only the left operand of each concatenation is descended into; right operands are added as they are.
    /// The walk is iterative so that a very long concatenation (one nesting level per operand) cannot
    /// exhaust the stack.
    /// </remarks>
    /// <param name="syntaxFacts">Language syntax facts used to recognize and split binary expressions.</param>
    /// <param name="pieces">Receives the operands. Existing contents are kept.</param>
    /// <param name="node">The expression to flatten. If it is not a string concatenation it is added as is.</param>
    /// <param name="semanticModel">Semantic model used to recognize string concatenations.</param>
    /// <param name="cancellationToken">Token used to cancel semantic queries.</param>
    private static void CollectPiecesDown(
        ISyntaxFactsService syntaxFacts,
        ArrayBuilder<SyntaxNode> pieces,
        SyntaxNode node,
        SemanticModel semanticModel,
        CancellationToken cancellationToken)
    {
        // Right operands seen while descending along the left spine, outermost (i.e. rightmost) first.
        using var _ = ArrayBuilder<SyntaxNode>.GetInstance(out var rightOperands);

        var current = node;
        while (IsStringConcat(syntaxFacts, current, semanticModel, cancellationToken))
        {
            syntaxFacts.GetPartsOfBinaryExpression(current, out var left, out var right);
            rightOperands.Add(right);
            current = left;
        }

        // The innermost left operand comes first, followed by the right operands from innermost to outermost.
        pieces.Add(current);
        for (var i = rightOperands.Count - 1; i >= 0; i--)
            pieces.Add(rightOperands[i]);
    }
 
    /// <summary>
    /// Determines whether <paramref name="expression"/> is a binary expression that binds to the built-in
    /// addition or concatenation operator declared on <see cref="string"/>.
    /// </summary>
    /// <returns>
    /// <see langword="false"/> for <see langword="null"/>, for non-binary expressions, and for binary
    /// expressions bound to any other operator.
    /// </returns>
    private static bool IsStringConcat(
        ISyntaxFactsService syntaxFacts, SyntaxNode? expression,
        SemanticModel semanticModel, CancellationToken cancellationToken)
    {
        if (!syntaxFacts.IsBinaryExpression(expression))
            return false;

        var boundSymbol = semanticModel.GetSymbolInfo(expression, cancellationToken).Symbol;
        if (boundSymbol is not IMethodSymbol operatorMethod)
            return false;

        if (operatorMethod.MethodKind != MethodKind.BuiltinOperator)
            return false;

        if (operatorMethod.ContainingType?.SpecialType != SpecialType.System_String)
            return false;

        var operatorName = operatorMethod.MetadataName;
        return operatorName == WellKnownMemberNames.AdditionOperatorName
            || operatorName == WellKnownMemberNames.ConcatenateOperatorName;
    }
}