可空引用类型底层实现

SunnyFan大约 11 分钟约 3422 字

可空引用类型底层实现

简介

C# 8 引入的可空引用类型（NRT，Nullable Reference Types）是编译时的静态分析特性，不影响运行时行为。理解 NRT 的底层实现——包括可空注解、编译器分析规则、Nullable Attribute 和与泛型的交互——有助于正确使用这一特性消除空引用异常。

特点

1.编译时特性 — 不改变运行时行为
2.Nullable Attribute — 编译器注解系统
3.流分析 — 编译器追踪可空状态
4.泛型约束 — T?/default/notnull
5.null 状态 — 非空、可能空、已空

编译器可空性分析

null 状态追踪

#nullable enable

// 编译器为每个表达式维护 null 状态：
// 1. NotNull — 确定不为 null
// 2. MaybeNull — 可能为 null
// 3. Null — 确定为 null

string notNull = "hello";     // 状态: NotNull
string? maybeNull = null;     // 状态: Null
string? maybeNull2 = GetName(); // 状态: MaybeNull

// 编译器根据赋值和检查更新状态
string? name = GetName();
// name 状态: MaybeNull → 警告：使用前可能为 null
int len = name.Length; // ⚠️ CS8602: 可能的 null 引用

// null 检查后状态变为 NotNull
if (name is not null)
{
    int len2 = name.Length; // ✅ 状态: NotNull
}

// 赋值后状态更新
name = "definite";
int len3 = name.Length; // ✅ 状态: NotNull

// 属性和字段的复杂分析
class Person
{
    public string Name { get; set; } // 非空属性

    public Person(string name)
    {
        Name = name; // 构造函数中初始化
    }

    // 可空自动属性
    public string? Nickname { get; set; }

    // required 属性（C# 11）— 确保初始化
    public required string Email { get; set; }
}

方法的可空性契约

#nullable enable

// 参数和返回值的 null 契约
// 非空参数：调用者保证不为 null
void Process(string name) // name 不能为 null
{
    Console.WriteLine(name.Length); // 安全
}

// 可空返回值：调用者需要处理 null
string? FindName(int id)
{
    return id switch
    {
        1 => "Alice",
        2 => "Bob",
        _ => null // 允许返回 null
    };
}

// 使用
string? result = FindName(3);
if (result is string name) // null 检查 + 类型模式
{
    Process(name); // 安全
}

// ! 操作符（null 饶恕）— 告诉编译器"我确定不为 null"
string? maybeNull = GetName();
Process(maybeNull!); // 编译器不再警告，但运行时可能抛 NullReferenceException
// ⚠️ 慎用！只在确定不会为 null 时使用

Nullable Attribute

编译器注解特性

// NRT 使用以下特性注解元数据（编译器自动添加）：
// [NullableAttribute]     — 标注类型的可空性
// [NullableContextAttribute] — 标注成员的默认可空上下文

// 查看编译器生成的注解
// #nullable enable 时编译的方法，元数据中包含 [NullableContext(2)]
// 2 = enable, 0 = disable, 1 = warnings

// 查看方法签名中的可空注解
var method = typeof(MyClass).GetMethod("FindName");
var attrs = method?.ReturnParameter.GetCustomAttributes(false);
// 包含 NullableAttribute(2) = 可空返回

// 自定义可空注解（用于反射场景）
[return: MaybeNull]
T Find<T>(IEnumerable<T> source, Func<T, bool> predicate)
{
    foreach (var item in source)
        if (predicate(item)) return item;
    return default; // default(T) 对于引用类型为 null
}

// 参数可空性注解
void SetName([DisallowNull] string? name, [AllowNull] string value)
{
    // DisallowNull: 参数类型是可空的，但不接受 null 传入
    // AllowNull: 参数类型是非空的，但允许 null 传入

    // 典型场景：
    // DisallowNull: 属性 getter 返回可空，但 setter 不接受 null
    // AllowNull: 属性 setter 接受 null（如重置为默认值）
}

public string? Config
{
    get => _config;
    [DisallowNull] set => _config = value; // 赋值时不接受 null
}

public string Label
{
    get => _label;
    [AllowNull] set => _label = value ?? "Default"; // 允许 null 赋值
}

private string? _config;
private string _label = "";

MemberNotNull 特性

// 告诉编译器某个方法返回后字段不为 null
class Service
{
    private string _connectionString;
    private HttpClient _client;

    public Service(string connectionString)
    {
        _connectionString = connectionString; // ✅ 初始化
        _client = null!; // ⚠️ 暂时设置，稍后初始化
        Initialize();    // 编译器不知道 Initialize 会设置 _client
    }

    // 告诉编译器 Initialize 执行后 _client 不为 null
    [MemberNotNull(nameof(_client))]
    private void Initialize()
    {
        _client = new HttpClient();
    }

    // 多个字段
    [MemberNotNull(nameof(_connectionString), nameof(_client))]
    private void InitializeAll()
    {
        _connectionString = BuildConnectionString();
        _client = new HttpClient();
    }

    // MemberNotNullWhen — 条件性保证
    [MemberNotNullWhen(true, nameof(_client))]
    private bool TryInitialize()
    {
        try
        {
            _client = new HttpClient();
            return true;
        }
        catch
        {
            return false;
        }
    }
}

泛型与可空性

T? 和泛型约束

#nullable enable

// T? 的行为取决于 T 的约束
// 1. 无约束的 T：T? 表示"default"（引用类型为 null，值类型为 Nullable<T>）
// 2. class 约束：T? 表示引用可空
// 3. struct 约束：T? 表示 Nullable<T>
// 4. notnull 约束（C# 8）：T 必须是非空引用类型或非空值类型

// 无约束泛型
T? FindFirst<T>(IEnumerable<T> source, Func<T, bool> predicate)
{
    foreach (var item in source)
        if (predicate(item)) return item;
    return default; // default(T) 对于引用类型是 null
}

// class 约束 — T 是引用类型
T? FindRef<T>(IEnumerable<T> source, Func<T, bool> predicate) where T : class
{
    foreach (var item in source)
        if (predicate(item)) return item;
    return null; // T? 是可空引用类型
}

// struct 约束 — T 是值类型
T? FindStruct<T>(IEnumerable<T> source, Func<T, bool> predicate) where T : struct
{
    foreach (var item in source)
        if (predicate(item)) return item;
    return null; // T? 是 Nullable<T>
}

// notnull 约束
void Add<TKey, TValue>(TKey key, TValue value)
    where TKey : notnull // key 不能是 null
{
    _dict[key] = value;
}

// default 约束（C# 9）— 允许泛型类型参数为 null
// 用于协变场景

泛型方法中的可空性约束

/// <summary>
/// 泛型方法中正确处理可空性的高级模式
/// </summary>

// 场景：泛型工厂方法
public static class Factory
{
    // 返回值可能为 null — 使用 T?
    public static T? CreateOrDefault<T>(Func<T>? factory = null)
        where T : class
    {
        return factory?.Invoke();
    }

    // 值类型的工厂方法
    public static T? CreateNullable<T>(Func<T>? factory = null)
        where T : struct
    {
        if (factory == null) return null;
        return factory();
    }

    // 混合约束的工厂
    public static T CreateOrThrow<T>(Func<T> factory)
        where T : notnull
    {
        var result = factory();
        if (result is null)
            throw new InvalidOperationException("Factory returned null");
        return result;
    }
}

// 场景：泛型映射器
public static class Mapper
{
    // 映射可能失败 — 返回 T?
    public static TTarget? Map<TSource, TTarget>(
        TSource source,
        Dictionary<string, object> mappings)
        where TTarget : class, new()
    {
        var target = new TTarget();
        foreach (var prop in typeof(TTarget).GetProperties())
        {
            if (mappings.TryGetValue(prop.Name, out var value))
                prop.SetValue(target, value);
        }
        return target;
    }

    // 使用 ArgumentNullException 验证非空
    public static void ValidateNotNull<T>(T value, string paramName)
        where T : notnull
    {
        if (value is null)
            throw new ArgumentNullException(paramName);
    }
}

可空性在接口设计中的应用

/// <summary>
/// 接口设计中的可空性最佳实践
/// </summary>

// ❌ 不好的接口设计 — 可空性不明确
public interface IBadRepository
{
    object GetById(int id);       // 返回什么？null？抛异常？
    void Save(object entity);     // entity 能为 null 吗？
    IEnumerable<object> GetAll(); // 永远不为 null？还是可能？
}

// ✅ 好的接口设计 — 明确可空性
public interface IRepository<T> where T : class
{
    T? FindById(int id);           // 可能返回 null
    T GetById(int id);             // 找不到抛异常
    IReadOnlyList<T> GetAll();     // 永远不为 null（空列表而非 null）
    void Add(T entity);            // entity 不为 null（notnull 约束）
    bool TryGet(int id, [NotNullWhen(true)] out T? entity);
}

// 泛型接口中的可空性
public interface IOptional<out T>
{
    bool HasValue { get; }
    T Value { get; } // T 不为 null 时才能访问
}

// 实现
public readonly struct Some<T> : IOptional<T>
{
    private readonly T _value;
    public Some(T value) => _value = value;
    public bool HasValue => true;
    public T Value => _value;
}

public readonly struct None<T> : IOptional<T>
{
    public bool HasValue => false;
    public T Value => throw new InvalidOperationException("No value");
}

可空性感知的泛型容器

#nullable enable

public class SafeDictionary<TKey, TValue> where TKey : notnull
{
    private readonly Dictionary<TKey, TValue> _dict = new();

    // 返回 TValue? 因为键可能不存在
    public TValue? TryGet(TKey key)
    {
        _dict.TryGetValue(key, out var value);
        return value; // 如果不存在返回 default(TValue)
    }

    // 对于值类型，TValue? 是 Nullable<T>
    // 对于引用类型，TValue? 是可空引用
    public TValue GetOrAdd(TKey key, Func<TKey, TValue> factory)
    {
        if (_dict.TryGetValue(key, out var value))
            return value;
        value = factory(key);
        _dict[key] = value;
        return value;
    }

    // KeyValuePair 的可空性
    public KeyValuePair<TKey, TValue>? FindByKey(TKey key)
    {
        if (_dict.TryGetValue(key, out var value))
            return new KeyValuePair<TKey, TValue>(key, value);
        return null; // 可空返回
    }
}

优点

1.编译时检查 — 在编写代码时发现潜在 null 问题
2.文档化 — 方法签名表达 null 契约
3.渐进式 — 可以按文件/方法启用
4.工具支持 — IDE 自动提示和修复

缺点

1.非运行时 — 不提供运行时 null 安全
2.误报 — 某些场景下编译器分析不够精确
3.迁移成本 — 现有项目启用需要大量标注
4.泛型复杂 — 泛型与可空性的交互复杂

编译器流分析的局限性

编译器无法处理的场景

/// <summary>
/// NRT 编译器分析的边界与局限
/// </summary>

// 局限 1：字段可空性不跨方法追踪
class FieldTrackingIssue
{
    private string _name; // 编译器认为可能是 null

    public void Initialize()
    {
        _name = "initialized"; // 编译器知道这里赋值了
    }

    public void Print()
    {
        // 编译器不知道 Initialize 是否已调用
        Console.WriteLine(_name.Length); // 警告 CS8602
    }

    // 解决：使用 [MemberNotNull]
    [MemberNotNull(nameof(_name))]
    public void InitializeSafe()
    {
        _name = "initialized";
    }
}

// 局限 2：跨线程的 null 状态
class ThreadSafetyIssue
{
    private string? _value;

    public void ThreadA()
    {
        _value = "set"; // 线程 A 设置
    }

    public void ThreadB()
    {
        if (_value != null)
        {
            // 编译器认为安全，但另一个线程可能已置空
            Console.WriteLine(_value.Length); // 理论上安全，实际上可能 NRE
        }
    }
}

// 局限 3：字典和集合的索引访问
public void DictionaryAccess(Dictionary<string, string> dict)
{
    // dict[key] 可能抛 KeyNotFoundException，不是 null
    // 但 TryGetValue 的 out 参数可空性需要正确标注
    if (dict.TryGetValue("key", out var value))
    {
        Console.WriteLine(value.Length); // 安全
    }
    // value 在这里是 null，编译器不知道
}

// 局限 4：反射和动态代码
public void ReflectionIssue(Type type)
{
    var property = type.GetProperty("Name");
    // property 可能为 null，编译器会正确提示
    // 但 GetMethod/GetProperty 的返回值是否为 null 取决于运行时

    var value = property?.GetValue(obj);
    // value 是 object?，需要手动检查
    if (value is string s)
    {
        Console.WriteLine(s.Length); // 安全
    }
}

SuppressNullableWarningExpression 的使用

/// <summary>
/// ! 操作符的正确使用场景
/// </summary>

// 场景 1：已知不为 null 但编译器无法推断
public class Service
{
    private readonly string _name;
    public Service()
    {
        // 构造函数中可能通过其他方法初始化
        Init();
        // 编译器不知道 Init 设置了 _name
    }

    private void Init() => _name = "default";

    public void UseName()
    {
        // 如果确定 Init 总是设置 _name
        Console.WriteLine(_name!.Length);
    }
}

// 场景 2：泛型工厂方法
public T Create<T>() where T : new()
{
    var result = new T();
    // 某些场景下 T 可能有可空字段
    return result;
}

// 场景 3：与未启用 NRT 的代码交互
public void InteropWithOldCode()
{
    object? result = LegacyLibrary.GetData();
    // 确定不为 null 但编译器不知道
    var data = (MyData)result!; // 断言不为 null
}

// ⚠️ 不要滥用 ! — 它绕过了编译器检查
// 只在以下情况使用：
// 1. 你 100% 确定不为 null
// 2. 有其他机制保证不为 null（如契约、初始化方法）
// 3. 临时迁移代码，后续修复

可空引用类型是纯编译时特性，通过 #nullable enable 启用。编译器为每个表达式维护 null 状态（NotNull/MaybeNull/Null），通过流分析追踪状态变化。[NullableAttribute] 和 [NullableContextAttribute] 写入元数据，供其他项目消费。[MemberNotNull] 告诉编译器方法返回后字段已初始化。泛型中 T? 的行为取决于约束：class 为可空引用、struct 为 Nullable<T>。notnull 约束确保类型参数不为 null。最佳实践：新项目默认启用、使用 ! 前充分验证、优先使用模式匹配检查 null。