我搜索并浏览了 Stack Overflow 上的 slug 标签,只找到了两个值得关注的解决方案:


那么,在 C# 和/或 .NET 中,是否有一种 slugify 算法的实现能够正确处理拉丁字符、Unicode 以及其他各种语言的问题?


/// <summary>
/// Builds a URL slug from <paramref name="phrase"/>: accents are removed, the text is
/// lower-cased, every character other than a-z, 0-9, white space and '-' is dropped,
/// runs of white space are collapsed, the text is cut to at most 45 characters and the
/// remaining white space is turned into hyphens.
/// </summary>
/// <param name="phrase">The text to convert. Must not be null.</param>
/// <returns>The slug; it can be empty when no character of the input is kept.</returns>
public static string GenerateSlug(this string phrase)
{
    // Longest slug (in characters) that is produced.
    const int maxLength = 45;

    // Lower-case with the invariant culture: the culture-sensitive ToLower() maps 'I'
    // to the dotless 'ı' under Turkish cultures, which the a-z filter below would drop.
    string str = phrase.RemoveAccent().ToLowerInvariant();
    // invalid chars
    str = Regex.Replace(str, @"[^a-z0-9\s-]", "");
    // convert multiple spaces into one space
    str = Regex.Replace(str, @"\s+", " ").Trim();
    // cut and trim (the cut can leave a trailing space behind, hence the second Trim)
    str = str.Substring(0, str.Length <= maxLength ? str.Length : maxLength).Trim();
    str = Regex.Replace(str, @"\s", "-"); // hyphens
    return str;
}

/// <summary>
/// Removes accents (combining diacritical marks) from <paramref name="txt"/>.
/// </summary>
/// <remarks>
/// Uses Unicode decomposition instead of a round trip through the "Cyrillic" code page:
/// that code page is not available by default on .NET Core / .NET 5+, and the round trip
/// turns every character it cannot map into '?'. Characters that have no canonical
/// decomposition are returned unchanged.
/// </remarks>
/// <param name="txt">The text to process. Must not be null.</param>
/// <returns>The text without non-spacing marks.</returns>
public static string RemoveAccent(this string txt)
{
    // Canonical decomposition splits an accented letter into its base letter
    // followed by one or more non-spacing marks.
    string decomposed = txt.Normalize(System.Text.NormalizationForm.FormD);
    var kept = new System.Text.StringBuilder(decomposed.Length);

    foreach (char c in decomposed)
    {
        if (System.Globalization.CharUnicodeInfo.GetUnicodeCategory(c) != System.Globalization.UnicodeCategory.NonSpacingMark)
        {
            kept.Append(c);
        }
    }

    // Recompose whatever is left so the result is in the usual composed form.
    return kept.ToString().Normalize(System.Text.NormalizationForm.FormC);
}
在这里,您可以找到一种在 C# 中生成 URL slug 的方法。此函数会删除所有重音(Marcel 的答案),把空格替换为连字符,删除无效字符,修剪两端的“-”和“_”,并把连续重复出现的“-”或“_”合并为一个


/// <summary>
/// Converts <paramref name="value"/> into a URL slug: lower-cases it, removes accents,
/// replaces white space with hyphens, drops every character other than a-z, 0-9, '-'
/// and '_', trims '-' and '_' from both ends and collapses repeated '-' / '_'.
/// </summary>
/// <remarks>
/// Accents are removed with Unicode decomposition instead of a round trip through the
/// "Cyrillic" code page, which is not available by default on .NET Core / .NET 5+.
/// </remarks>
/// <param name="value">The text to convert. Must not be null.</param>
/// <returns>The slug; it can be empty when no character of the input is kept.</returns>
public static string ToUrlSlug(string value)
{
    // First to lower case
    value = value.ToLowerInvariant();

    // Remove all accents: decompose, then skip the non-spacing marks
    string decomposed = value.Normalize(NormalizationForm.FormD);
    var kept = new StringBuilder(decomposed.Length);
    foreach (char c in decomposed)
    {
        if (System.Globalization.CharUnicodeInfo.GetUnicodeCategory(c) != System.Globalization.UnicodeCategory.NonSpacingMark)
        {
            kept.Append(c);
        }
    }
    value = kept.ToString().Normalize(NormalizationForm.FormC);

    // Replace spaces
    value = Regex.Replace(value, @"\s", "-", RegexOptions.Compiled);

    // Remove invalid chars. No white space is left at this point, so only a-z, 0-9,
    // '_' and '-' have to be kept; the hyphen goes last so it cannot read as a range.
    value = Regex.Replace(value, @"[^a-z0-9_-]", "", RegexOptions.Compiled);

    // Trim dashes and underscores from both ends
    value = value.Trim('-', '_');

    // Replace runs of - and/or _ with a single character (the last one of the run)
    value = Regex.Replace(value, @"([-_]){2,}", "$1", RegexOptions.Compiled);

    return value;
}
  • 使用广泛接受的方法来去除重音。
  • 显式正则表达式缓存以适度提高速度。
  • 更多的单词分隔符被识别并规范化为连字符。


/// <summary>
/// Generates URL slugs: lower-case text restricted to a-z, 0-9 and single hyphens.
/// </summary>
public class UrlSlugger
{
    // white space, em-dash, en-dash, underscore
    static readonly Regex WordDelimiters = new Regex(@"[\s—–_]", RegexOptions.Compiled);

    // characters that are not valid
    static readonly Regex InvalidChars = new Regex(@"[^a-z0-9\-]", RegexOptions.Compiled);

    // multiple hyphens
    static readonly Regex MultipleHyphens = new Regex(@"-{2,}", RegexOptions.Compiled);

    /// <summary>
    /// Converts <paramref name="value"/> into a URL slug.
    /// </summary>
    /// <param name="value">The text to convert. Must not be null.</param>
    /// <returns>The slug; it can be empty when no character of the input is kept.</returns>
    public static string ToUrlSlug(string value)
    {
        // convert to lower case
        value = value.ToLowerInvariant();

        // remove diacritics (accents)
        value = RemoveDiacritics(value);

        // ensure all word delimiters are hyphens
        value = WordDelimiters.Replace(value, "-");

        // strip out invalid characters
        value = InvalidChars.Replace(value, "");

        // replace multiple hyphens (-) with a single hyphen
        value = MultipleHyphens.Replace(value, "-");

        // trim hyphens (-) from ends
        return value.Trim('-');
    }

    /// <summary>
    /// Removes non-spacing marks (accents) from <paramref name="stIn"/>.
    /// </summary>
    /// <remarks>See: http://www.siao2.com/2007/05/14/2629747.aspx</remarks>
    /// <param name="stIn">The text to process.</param>
    /// <returns>The text without non-spacing marks, normalized to form C.</returns>
    private static string RemoveDiacritics(string stIn)
    {
        // Form D separates each base character from its combining marks.
        string stFormD = stIn.Normalize(NormalizationForm.FormD);
        StringBuilder sb = new StringBuilder();

        for (int ich = 0; ich < stFormD.Length; ich++)
        {
            UnicodeCategory uc = CharUnicodeInfo.GetUnicodeCategory(stFormD[ich]);
            if (uc != UnicodeCategory.NonSpacingMark)
            {
                // Keep everything except the marks themselves.
                sb.Append(stFormD[ich]);
            }
        }

        return (sb.ToString().Normalize(NormalizationForm.FormC));
    }
}


// Sample text made of four non-Latin (Chinese) characters.
string original = "测试公司";

// Percent-encode the text. The escaped result is the string shown below
// (three escaped bytes for each of the four characters):
// %E6%B5%8B%E8%AF%95%E5%85%AC%E5%8F%B8
string converted = Uri.EscapeDataString(original);


<a href="http://www.example.com/100/%E6%B5%8B%E8%AF%95%E5%85%AC%E5%8F%B8">



注意:为了让 Uri.EscapeDataString 以这种方式工作,必须启用 iriParsing。


对于那些希望在 C# 中生成 URL Slugs 的人,我建议查看这个相关问题:

Stack Overflow 如何生成对 SEO 友好的 URL?


我在 slug 化(slugification,新词!)中遇到的一个问题是冲突。例如,如果我有一篇名为“Stack-Overflow”的博文和一篇名为“Stack Overflow”的博文,那么这两个标题生成的 slug 是相同的。因此,我的 slug 生成器通常必须以某种方式涉及数据库。这可能就是您看不到更多通用解决方案的原因。

  • 删除变音符号(所以我们不只是删除“无效”字符)
  • 结果的最大长度(或在删除变音符号之前 - “早期截断”)
  • 规范化块之间的自定义分隔符
  • 结果可以强制为大写或小写
  • 支持的 unicode 类别的可配置列表
  • 允许字符范围的可配置列表
  • 支持 .NET Framework 2.0


/// <summary>
/// Defines a set of utilities for creating slug urls.
/// </summary>
public static class Slug
{
    /// <summary>
    /// Creates a slug from the specified text, using default options.
    /// </summary>
    /// <param name="text">The text. If null is specified, null will be returned.</param>
    /// <returns>
    /// A slugged text.
    /// </returns>
    public static string Create(string text)
    {
        return Create(text, (SlugOptions)null);
    }

    /// <summary>
    /// Creates a slug from the specified text.
    /// </summary>
    /// <remarks>
    /// The text is decomposed (normalization form D) and scanned character by character:
    /// allowed characters are case-converted as requested and appended, non-spacing marks
    /// are skipped, and any other character is turned into a single separator.
    /// </remarks>
    /// <param name="text">The text. If null is specified, null will be returned.</param>
    /// <param name="options">The options. May be null, in which case default options are used.</param>
    /// <returns>A slugged text.</returns>
    public static string Create(string text, SlugOptions options)
    {
        if (text == null)
        {
            return null;
        }

        if (options == null)
        {
            options = new SlugOptions();
        }

        // With early truncation the input is cut before it is decomposed; otherwise the
        // whole text is decomposed and the length limit is applied to the output only.
        string normalised;
        if (options.EarlyTruncate && options.MaximumLength > 0 && text.Length > options.MaximumLength)
        {
            normalised = text.Substring(0, options.MaximumLength).Normalize(NormalizationForm.FormD);
        }
        else
        {
            normalised = text.Normalize(NormalizationForm.FormD);
        }

        int max = options.MaximumLength > 0 ? Math.Min(normalised.Length, options.MaximumLength) : normalised.Length;
        StringBuilder sb = new StringBuilder(max);
        for (int i = 0; i < normalised.Length; i++)
        {
            char c = normalised[i];
            UnicodeCategory uc = char.GetUnicodeCategory(c);
            if (options.AllowedUnicodeCategories.Contains(uc) && options.IsAllowed(c))
            {
                switch (uc)
                {
                    case UnicodeCategory.UppercaseLetter:
                        if (options.ToLower)
                        {
                            c = options.Culture != null ? char.ToLower(c, options.Culture) : char.ToLowerInvariant(c);
                        }
                        break;

                    case UnicodeCategory.LowercaseLetter:
                        if (options.ToUpper)
                        {
                            c = options.Culture != null ? char.ToUpper(c, options.Culture) : char.ToUpperInvariant(c);
                        }
                        break;
                }

                // Give the options a chance to substitute the character.
                sb.Append(options.Replace(c));
            }
            else if (uc == UnicodeCategory.NonSpacingMark)
            {
                // don't add a separator: the mark belongs to the previous base character
            }
            else if (options.Separator != null && !EndsWith(sb, options.Separator))
            {
                // Any other character becomes a separator, but never two in a row.
                sb.Append(options.Separator);
            }

            if (options.MaximumLength > 0 && sb.Length >= options.MaximumLength)
            {
                break;
            }
        }

        string result = sb.ToString();

        // The last append can overshoot the limit when it adds more than one character.
        if (options.MaximumLength > 0 && result.Length > options.MaximumLength)
        {
            result = result.Substring(0, options.MaximumLength);
        }

        // Ordinal comparison, consistent with the character-by-character EndsWith helper.
        if (!options.CanEndWithSeparator && options.Separator != null && result.EndsWith(options.Separator, StringComparison.Ordinal))
        {
            result = result.Substring(0, result.Length - options.Separator.Length);
        }

        return result.Normalize(NormalizationForm.FormC);
    }

    /// <summary>
    /// Determines whether the content of <paramref name="sb"/> ends with <paramref name="text"/>,
    /// comparing character by character.
    /// </summary>
    private static bool EndsWith(StringBuilder sb, string text)
    {
        if (sb.Length < text.Length)
        {
            return false;
        }

        // Walk both sequences backwards from their last character.
        for (int i = 0; i < text.Length; i++)
        {
            if (sb[sb.Length - 1 - i] != text[text.Length - 1 - i])
            {
                return false;
            }
        }
        return true;
    }
}

/// <summary>
/// Defines options for the Slug utility class.
/// </summary>
public class SlugOptions
{
    /// <summary>
    /// Defines the default maximum length. Currently equal to 80.
    /// </summary>
    public const int DefaultMaximumLength = 80;

    /// <summary>
    /// Defines the default separator. Currently equal to "-".
    /// </summary>
    public const string DefaultSeparator = "-";

    private bool _toLower;
    private bool _toUpper;

    /// <summary>
    /// Initializes a new instance of the <see cref="SlugOptions"/> class with the default
    /// maximum length and separator, allowing the characters a-z, A-Z and 0-9.
    /// </summary>
    public SlugOptions()
    {
        MaximumLength = DefaultMaximumLength;
        Separator = DefaultSeparator;

        // Slug.Create keeps a character only when its category is listed here AND
        // IsAllowed accepts it, so the categories of the default ranges below must be
        // listed as well; with an empty list every character would be rejected.
        AllowedUnicodeCategories = new List<UnicodeCategory>();
        AllowedUnicodeCategories.Add(UnicodeCategory.UppercaseLetter);
        AllowedUnicodeCategories.Add(UnicodeCategory.LowercaseLetter);
        AllowedUnicodeCategories.Add(UnicodeCategory.DecimalDigitNumber);

        AllowedRanges = new List<KeyValuePair<short, short>>();
        AllowedRanges.Add(new KeyValuePair<short, short>((short)'a', (short)'z'));
        AllowedRanges.Add(new KeyValuePair<short, short>((short)'A', (short)'Z'));
        AllowedRanges.Add(new KeyValuePair<short, short>((short)'0', (short)'9'));
    }

    /// <summary>
    /// Gets the allowed unicode categories list.
    /// </summary>
    /// <value>
    /// The allowed unicode categories list.
    /// </value>
    public virtual IList<UnicodeCategory> AllowedUnicodeCategories { get; private set; }

    /// <summary>
    /// Gets the allowed ranges list. Each entry is an inclusive range of character codes
    /// (key = first code, value = last code).
    /// </summary>
    /// <value>
    /// The allowed ranges list.
    /// </value>
    public virtual IList<KeyValuePair<short, short>> AllowedRanges { get; private set; }

    /// <summary>
    /// Gets or sets the maximum length.
    /// </summary>
    /// <value>
    /// The maximum length.
    /// </value>
    public virtual int MaximumLength { get; set; }

    /// <summary>
    /// Gets or sets the separator.
    /// </summary>
    /// <value>
    /// The separator.
    /// </value>
    public virtual string Separator { get; set; }

    /// <summary>
    /// Gets or sets the culture for case conversion.
    /// </summary>
    /// <value>
    /// The culture.
    /// </value>
    public virtual CultureInfo Culture { get; set; }

    /// <summary>
    /// Gets or sets a value indicating whether the string can end with a separator string.
    /// </summary>
    /// <value>
    ///   <c>true</c> if the string can end with a separator string; otherwise, <c>false</c>.
    /// </value>
    public virtual bool CanEndWithSeparator { get; set; }

    /// <summary>
    /// Gets or sets a value indicating whether the string is truncated before normalization.
    /// </summary>
    /// <value>
    ///   <c>true</c> if the string is truncated before normalization; otherwise, <c>false</c>.
    /// </value>
    public virtual bool EarlyTruncate { get; set; }

    /// <summary>
    /// Gets or sets a value indicating whether to lowercase the resulting string.
    /// Setting it to <c>true</c> resets <see cref="ToUpper"/> to <c>false</c>.
    /// </summary>
    /// <value>
    ///   <c>true</c> if the resulting string must be lowercased; otherwise, <c>false</c>.
    /// </value>
    public virtual bool ToLower
    {
        get
        {
            return _toLower;
        }
        set
        {
            _toLower = value;
            if (_toLower)
            {
                // The two case options are mutually exclusive.
                _toUpper = false;
            }
        }
    }

    /// <summary>
    /// Gets or sets a value indicating whether to uppercase the resulting string.
    /// Setting it to <c>true</c> resets <see cref="ToLower"/> to <c>false</c>.
    /// </summary>
    /// <value>
    ///   <c>true</c> if the resulting string must be uppercased; otherwise, <c>false</c>.
    /// </value>
    public virtual bool ToUpper
    {
        get
        {
            return _toUpper;
        }
        set
        {
            _toUpper = value;
            if (_toUpper)
            {
                // The two case options are mutually exclusive.
                _toLower = false;
            }
        }
    }

    /// <summary>
    /// Determines whether the specified character is allowed, i.e. whether it falls
    /// inside at least one of the <see cref="AllowedRanges"/>.
    /// </summary>
    /// <param name="character">The character.</param>
    /// <returns>true if the character is allowed; false otherwise.</returns>
    public virtual bool IsAllowed(char character)
    {
        foreach (var p in AllowedRanges)
        {
            if (character >= p.Key && character <= p.Value)
            {
                return true;
            }
        }
        return false;
    }

    /// <summary>
    /// Replaces the specified character by a given string. This implementation returns
    /// the character itself; derived classes can override it to substitute characters.
    /// </summary>
    /// <param name="character">The character to replace.</param>
    /// <returns>a string.</returns>
    public virtual string Replace(char character)
    {
        return character.ToString();
    }
}
于 2015-09-10T06:52:16.043 回答