C++ string 类模拟实现：从浅拷贝到深拷贝的深度解析

C++ string 类模拟实现

面试中的经典问题

在 C++ 面试中，面试官常要求手写 string 类的模拟实现。这不仅是考察语法，更是为了验证你对内存管理、资源获取即初始化（RAII）以及三法则（Rule of Three）的理解。

我们先看一个基础版本，看看它存在什么问题：

// Named String (capital S) to distinguish it from the standard library's string.
//
// NOTE: this is the deliberately basic version used to demonstrate the
// shallow-copy problem. It defines neither a copy constructor nor a copy
// assignment operator, so the compiler-generated ones copy only the pointer
// and two objects end up owning the same buffer.
class String {
public:
    // Builds a String that owns a heap copy of the C string `str`.
    // Passing nullptr is a programming error and trips the assertion.
    String(const char* str = "") {
        if (nullptr == str) {
            assert(false);
            // Reached only when assertions are compiled out; _str keeps its
            // nullptr default so the destructor stays safe.
            return;
        }
        _str = new char[strlen(str) + 1];  // +1 for the trailing '\0'
        strcpy(_str, str);
    }

    // Releases the owned buffer, if any.
    ~String() {
        if (_str) {
            delete[] _str;
            _str = nullptr;
        }
    }

private:
    char* _str = nullptr;  // owned, NUL-terminated character buffer
};

测试代码：

// Demonstrates the shallow-copy problem: String declares no copy constructor,
// so s2 is built by the compiler-generated one, which copies only the pointer.
void TestString() {
    String s1("hello bit!!!");
    String s2(s1);  // member-wise copy: s2 now points at the same buffer as s1
}  // both destructors run here and delete[] that one buffer twice

问题分析：上述 String 类没有显式定义拷贝构造函数与赋值运算符重载，编译器会合成默认版本。当用 s1 构造 s2 时，调用的是默认拷贝构造，它只是逐成员复制指针 _str 的值。最终导致的问题是，s1、s2 的 _str 指向同一块内存空间。函数结束时两个对象先后析构，同一块空间被释放多次，引起程序崩溃。这种拷贝方式称为浅拷贝。

浅拷贝的隐患

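浅拷贝也称位拷贝，编译器只是将对象中的值拷贝过来。如果对象中管理资源，最后就会导致多个对象共享同一份资源。当一个对象销毁时就会将该资源释放掉，而此时另一些对象不知道该资源已经被释放，以为还有效，所以当继续对资源进行操作时，就会发生访问违规。

要避免这个问题，需要显式定义拷贝构造函数和赋值运算符重载，为每个对象分配独立的空间并复制内容，这种拷贝方式称为深拷贝。下面是 bit::string 模拟实现的源文件（类的声明位于 string.h 中）以及配套的测试代码：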

#include "string.h" namespace bit { void string::reserve(size_t n) { if (n > _capacity) { char* tmp = new char[n + 1]; strcpy(tmp, _str); delete[] _str; _str = tmp; _capacity = n; } } void string::push_back(char ch) { if (_size == _capacity) reserve(_capacity == 0 ? 4 : _capacity * 2); _str[_size] = ch; ++_size; _str[_size] = '\0'; } string& string::operator+=(char ch) { push_back(ch); return *this; } void string::append(const char* str) { size_t len = strlen(str); if (_size + len > _capacity) reserve(_size + len > _capacity * 2 ? _size + len : _capacity * 2); strcpy(_str + _size, str); _size += len; } string& string::operator+=(const char* str) { append(str); return *this; } void string::insert(size_t pos, char ch) { assert(pos <= _size); if (_size == _capacity) reserve(_capacity == 0 ? 4 : _capacity * 2); size_t end = _size + 1; while (end > pos) { _str[end] = _str[end - 1]; --end; } _str[pos] = ch; ++_size; } void string::insert(size_t pos, const char* str) { assert(pos <= _size); size_t len = strlen(str); if (_size + len > _capacity) reserve(_size + len > _capacity * 2 ? 
_size + len : _capacity * 2); size_t end = _size + len; if (len == 0) return; while (end > pos + len - 1) { _str[end] = _str[end - len]; --end; } for (size_t i = 0; i < len; ++i) _str[pos + i] = str[i]; _size += len; } void string::erase(size_t pos, size_t len) { assert(pos < _size); if (len > _size - pos) { _str[pos] = '\0'; _size = pos; } else { for (size_t i = pos + len; i <= _size; i++) _str[i - len] = _str[i]; _size -= len; } } size_t string::find(char ch, size_t pos) { for (size_t i = pos; i < _size; i++) { if (_str[i] == ch) return i; } return npos; } size_t string::find(const char* str, size_t pos) { assert(pos < _size); const char* ptr = strstr(_str + pos, str); if (ptr == nullptr) return npos; else return ptr - _str; } string string::substr(size_t pos, size_t len) { assert(pos < _size); if (len > _size - pos) len = _size - pos; string sub; sub.reserve(len); for (size_t i = 0; i < len; ++i) sub += _str[pos + i]; return sub; } void test_string1() { string s1; string s2("hello world"); cout << s1.c_str() << endl; cout << s2.c_str() << endl; for (size_t i = 0; i < s2.size(); ++i) s2[i] += 2; cout << s2.c_str() << endl; for (auto e : s2) cout << e << " "; cout << endl; string::iterator it = s2.begin(); while (it != s2.end()) { cout << *it << " "; ++it; } } void test_string2() { string s1("hello wwww"); s1 += 'x'; cout << s1.c_str() << endl; s1.insert(3, "sss"); cout << s1.c_str() << endl; s1.erase(3, 2); cout << s1.c_str() << endl; } void test_string3() { string s("666.cpp.zip"); size_t pos = s.find('.'); string suffix = s.substr(pos); cout << suffix.c_str() << endl; string copy(s); cout << copy.c_str() << endl; } bool operator<(const string& s1, const string& s2) { return strcmp(s1.c_str(), s2.c_str()) < 0; } bool operator==(const string& s1, const string& s2) { return strcmp(s1.c_str(), s2.c_str()) == 0; } bool operator>(const string& s1, const string& s2) { return !(s1 < s2 || s1 == s2); } bool operator<=(const string& s1, const string& s2) { return s1 < s2 
|| s1 == s2; } bool operator>=(const string& s1, const string& s2) { return !(s1 < s2); } bool operator!=(const string& s1, const string& s2) { return !(s1 == s2); } ostream& operator<<(ostream& out, const string& s) { for (auto ch : s) out << ch; return out; } istream& operator>>(istream& in, string& s) { s.clear(); const int N = 256; char buff[N]; int i = 0; char ch; ch = in.get(); while (ch != ' ' && ch != '\n') { buff[i++] = ch; if (i == N - 1) { buff[i] = '\0'; s += buff; i = 0; } s += ch; ch = in.get(); if (i > 0) { buff[i] = '\0'; s += buff; } } return in; } void test_string4() { string s1("hello"); cin >> s1; cout << s1 << endl; cout << "he"; } int main() { bit::test_string4(); return 0; } }

C++ string 类模拟实现：从浅拷贝到深拷贝的深度解析