206 lines
6.2 KiB
C#
206 lines
6.2 KiB
C#
|
using System;
|
||
|
using System.Collections.Generic;
|
||
|
using System.Globalization;
|
||
|
using System.Text;
|
||
|
|
||
|
namespace GodotTools.ProjectEditor
|
||
|
{
|
||
|
public static class IdentifierUtils
|
||
|
{
|
||
|
public static string SanitizeQualifiedIdentifier(string qualifiedIdentifier, bool allowEmptyIdentifiers)
|
||
|
{
|
||
|
if (string.IsNullOrEmpty(qualifiedIdentifier))
|
||
|
throw new ArgumentException($"{nameof(qualifiedIdentifier)} cannot be empty", nameof(qualifiedIdentifier));
|
||
|
|
||
|
string[] identifiers = qualifiedIdentifier.Split('.');
|
||
|
|
||
|
for (int i = 0; i < identifiers.Length; i++)
|
||
|
{
|
||
|
identifiers[i] = SanitizeIdentifier(identifiers[i], allowEmpty: allowEmptyIdentifiers);
|
||
|
}
|
||
|
|
||
|
return string.Join(".", identifiers);
|
||
|
}
|
||
|
|
||
|
/// <summary>
|
||
|
/// Skips invalid identifier characters including decimal digit numbers at the start of the identifier.
|
||
|
/// </summary>
|
||
|
private static void SkipInvalidCharacters(string source, int startIndex, StringBuilder outputBuilder)
|
||
|
{
|
||
|
for (int i = startIndex; i < source.Length; i++)
|
||
|
{
|
||
|
char @char = source[i];
|
||
|
|
||
|
switch (char.GetUnicodeCategory(@char))
|
||
|
{
|
||
|
case UnicodeCategory.UppercaseLetter:
|
||
|
case UnicodeCategory.LowercaseLetter:
|
||
|
case UnicodeCategory.TitlecaseLetter:
|
||
|
case UnicodeCategory.ModifierLetter:
|
||
|
case UnicodeCategory.LetterNumber:
|
||
|
case UnicodeCategory.OtherLetter:
|
||
|
outputBuilder.Append(@char);
|
||
|
break;
|
||
|
case UnicodeCategory.NonSpacingMark:
|
||
|
case UnicodeCategory.SpacingCombiningMark:
|
||
|
case UnicodeCategory.ConnectorPunctuation:
|
||
|
case UnicodeCategory.DecimalDigitNumber:
|
||
|
// Identifiers may start with underscore
|
||
|
if (outputBuilder.Length > startIndex || @char == '_')
|
||
|
outputBuilder.Append(@char);
|
||
|
break;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
public static string SanitizeIdentifier(string identifier, bool allowEmpty)
|
||
|
{
|
||
|
if (string.IsNullOrEmpty(identifier))
|
||
|
{
|
||
|
if (allowEmpty)
|
||
|
return "Empty"; // Default value for empty identifiers
|
||
|
|
||
|
throw new ArgumentException($"{nameof(identifier)} cannot be empty if {nameof(allowEmpty)} is false", nameof(identifier));
|
||
|
}
|
||
|
|
||
|
if (identifier.Length > 511)
|
||
|
identifier = identifier.Substring(0, 511);
|
||
|
|
||
|
var identifierBuilder = new StringBuilder();
|
||
|
int startIndex = 0;
|
||
|
|
||
|
if (identifier[0] == '@')
|
||
|
{
|
||
|
identifierBuilder.Append('@');
|
||
|
startIndex += 1;
|
||
|
}
|
||
|
|
||
|
SkipInvalidCharacters(identifier, startIndex, identifierBuilder);
|
||
|
|
||
|
if (identifierBuilder.Length == startIndex)
|
||
|
{
|
||
|
// All characters were invalid so now it's empty. Fill it with something.
|
||
|
identifierBuilder.Append("Empty");
|
||
|
}
|
||
|
|
||
|
identifier = identifierBuilder.ToString();
|
||
|
|
||
|
if (identifier[0] != '@' && IsKeyword(identifier, anyDoubleUnderscore: true))
|
||
|
identifier = '@' + identifier;
|
||
|
|
||
|
return identifier;
|
||
|
}
|
||
|
|
||
|
private static bool IsKeyword(string value, bool anyDoubleUnderscore)
|
||
|
{
|
||
|
// Identifiers that start with double underscore are meant to be used for reserved keywords.
|
||
|
// Only existing keywords are enforced, but it may be useful to forbid any identifier
|
||
|
// that begins with double underscore to prevent issues with future C# versions.
|
||
|
if (anyDoubleUnderscore)
|
||
|
{
|
||
|
if (value.Length > 2 && value[0] == '_' && value[1] == '_' && value[2] != '_')
|
||
|
return true;
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
if (_doubleUnderscoreKeywords.Contains(value))
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
return _keywords.Contains(value);
|
||
|
}
|
||
|
|
||
|
private static readonly HashSet<string> _doubleUnderscoreKeywords = new HashSet<string>
|
||
|
{
|
||
|
"__arglist",
|
||
|
"__makeref",
|
||
|
"__reftype",
|
||
|
"__refvalue",
|
||
|
};
|
||
|
|
||
|
private static readonly HashSet<string> _keywords = new HashSet<string>
|
||
|
{
|
||
|
"as",
|
||
|
"do",
|
||
|
"if",
|
||
|
"in",
|
||
|
"is",
|
||
|
"for",
|
||
|
"int",
|
||
|
"new",
|
||
|
"out",
|
||
|
"ref",
|
||
|
"try",
|
||
|
"base",
|
||
|
"bool",
|
||
|
"byte",
|
||
|
"case",
|
||
|
"char",
|
||
|
"else",
|
||
|
"enum",
|
||
|
"goto",
|
||
|
"lock",
|
||
|
"long",
|
||
|
"null",
|
||
|
"this",
|
||
|
"true",
|
||
|
"uint",
|
||
|
"void",
|
||
|
"break",
|
||
|
"catch",
|
||
|
"class",
|
||
|
"const",
|
||
|
"event",
|
||
|
"false",
|
||
|
"fixed",
|
||
|
"float",
|
||
|
"sbyte",
|
||
|
"short",
|
||
|
"throw",
|
||
|
"ulong",
|
||
|
"using",
|
||
|
"where",
|
||
|
"while",
|
||
|
"yield",
|
||
|
"double",
|
||
|
"extern",
|
||
|
"object",
|
||
|
"params",
|
||
|
"public",
|
||
|
"return",
|
||
|
"sealed",
|
||
|
"sizeof",
|
||
|
"static",
|
||
|
"string",
|
||
|
"struct",
|
||
|
"switch",
|
||
|
"typeof",
|
||
|
"unsafe",
|
||
|
"ushort",
|
||
|
"checked",
|
||
|
"decimal",
|
||
|
"default",
|
||
|
"finally",
|
||
|
"foreach",
|
||
|
"partial",
|
||
|
"private",
|
||
|
"virtual",
|
||
|
"abstract",
|
||
|
"continue",
|
||
|
"delegate",
|
||
|
"explicit",
|
||
|
"implicit",
|
||
|
"internal",
|
||
|
"operator",
|
||
|
"override",
|
||
|
"readonly",
|
||
|
"volatile",
|
||
|
"interface",
|
||
|
"namespace",
|
||
|
"protected",
|
||
|
"unchecked",
|
||
|
"stackalloc",
|
||
|
};
|
||
|
}
|
||
|
}
|