Skip to content

Commit d063240

Browse files
author
wuxianrong
committed
The data backup and recovery functions have been added
1 parent 3e19283 commit d063240

26 files changed

Lines changed: 2168 additions & 16 deletions

.github/workflows/pika.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ jobs:
4141
- name: Install Deps
4242
run: |
4343
sudo apt-get update
44-
sudo apt-get install -y autoconf libprotobuf-dev protobuf-compiler clang-tidy
44+
sudo apt-get install -y autoconf libprotobuf-dev protobuf-compiler clang-tidy libssl-dev
4545
4646
- name: Configure CMake
4747
# Configure CMake in a 'build' subdirectory. `CMAKE_BUILD_TYPE` is only required if you are using a single-configuration generator such as make.
@@ -166,8 +166,8 @@ jobs:
166166
- name: Install deps
167167
run: |
168168
dnf update -y
169-
dnf install -y bash cmake wget git autoconf gcc perl-Digest-SHA tcl which tar g++ tar epel-release gcc-c++ libstdc++-devel gcc-toolset-13 binutils
170169
dnf clean all
170+
dnf install -y bash cmake wget git autoconf gcc perl-Digest-SHA tcl which tar g++ tar epel-release gcc-c++ libstdc++-devel gcc-toolset-13 openssl-devel zlib-devel
171171
rm -rf /var/cache/dnf
172172
173173
- name: Set up Go

CMakeLists.txt

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -89,6 +89,18 @@ set(INSTALL_LIBDIR ${STAGED_INSTALL_PREFIX}/lib)
8989
set(INSTALL_LIBDIR_64 ${STAGED_INSTALL_PREFIX}/lib64)
9090
set(CMAKE_PREFIX_PATH ${CMAKE_PREFIX_PATH} ${STAGED_INSTALL_PREFIX})
9191

92+
# Configure-time fix-up for a brpc header that is already staged from an
# earlier build: the `#ifndef __const__` guard in butil/errno.h conflicts with
# GCC 13+/glibc 2.38+, so it is rewritten to `#if 0`. Doing this during CMake
# configuration also repairs cached/existing headers.
if(EXISTS "${INSTALL_INCLUDEDIR}/butil/errno.h")
  file(READ "${INSTALL_INCLUDEDIR}/butil/errno.h" ERRNO_H_CONTENT)
  string(FIND "${ERRNO_H_CONTENT}" "#ifndef __const__" HAS_CONST_MACRO)
  # string(FIND) stores -1 when the guard is absent, i.e. the header is
  # already patched (or never contained the guard) and must be left alone.
  if(HAS_CONST_MACRO GREATER -1)
    message(STATUS "Patching existing brpc errno.h for GCC 13+ compatibility")
    string(REPLACE "#ifndef __const__" "#if 0 /* disabled for GCC 13+ compatibility */" ERRNO_H_CONTENT "${ERRNO_H_CONTENT}")
    file(WRITE "${INSTALL_INCLUDEDIR}/butil/errno.h" "${ERRNO_H_CONTENT}")
  endif()
endif()
103+
92104
execute_process(COMMAND sh ${CMAKE_UTILS_DIR}/Get_OS_Version.sh
93105
OUTPUT_VARIABLE OS_VERSION)
94106

@@ -664,6 +676,12 @@ ExternalProject_Add(brpc
664676
1
665677
UPDATE_COMMAND
666678
""
679+
# Patch to fix __const__ macro conflict with GCC 13+/glibc 2.38+
680+
# The issue is that brpc defines __const__ as __unused__ which conflicts with
681+
# glibc's __glibc_has_attribute(__const__) macro in sys/cdefs.h
682+
# We replace '#ifndef __const__' with '#if 0' to disable the problematic macro
683+
PATCH_COMMAND
684+
sh -c "sed -i.bak 's/#ifndef __const__/#if 0 /' src/butil/errno.h && cat src/butil/errno.h | head -35"
667685
LOG_CONFIGURE
668686
1
669687
LOG_BUILD
@@ -677,16 +695,29 @@ ExternalProject_Add(brpc
677695
-DCMAKE_INSTALL_PREFIX=${STAGED_INSTALL_PREFIX}
678696
-DCMAKE_BUILD_TYPE=${LIB_BUILD_TYPE}
679697
-DCMAKE_PREFIX_PATH=${CMAKE_PREFIX_PATH}
698+
-DCMAKE_FIND_ROOT_PATH=${STAGED_INSTALL_PREFIX}
699+
-DCMAKE_INCLUDE_PATH=${INSTALL_INCLUDEDIR}
700+
-DCMAKE_LIBRARY_PATH=${INSTALL_LIBDIR}
680701
-DWITH_GLOG=ON
681702
-DWITH_SNAPPY=ON
682703
-DBUILD_SHARED_LIBS=OFF
683704
-DDOWNLOAD_GTEST=OFF
705+
-DCMAKE_EXE_LINKER_FLAGS=-L${INSTALL_LIBDIR}\ -L${INSTALL_LIBDIR_64}
684706
BUILD_ALWAYS
685707
1
686708
BUILD_COMMAND
687709
make -j${CPU_CORE}
688710
)
689711

712+
# Patch the *installed* brpc header once the install step has finished.
# braft is compiled against the installed headers rather than the patched
# source tree, and the __const__ macro in butil/errno.h conflicts with
# glibc 2.38+ / GCC 13+.
#
# The header path is single-quoted inside the shell script so that a staging
# prefix containing whitespace does not split into several arguments. The
# first 35 lines of the patched header are echoed to make the result visible
# in the build log.
ExternalProject_Add_Step(brpc fix_installed_headers
  COMMAND sh -c "sed -i.bak 's/#ifndef __const__/#if 0 /' '${INSTALL_INCLUDEDIR}/butil/errno.h' && head -35 '${INSTALL_INCLUDEDIR}/butil/errno.h'"
  DEPENDEES install
  COMMENT "Patching installed brpc headers for GCC 13+ compatibility"
)
720+
690721
if(${OS_VERSION} MATCHES "Rocky" OR ${OS_VERSION} MATCHES "CentOS")
691722
set(BRPC_LIBRARY ${INSTALL_LIBDIR_64}/libbrpc.a)
692723
else()

docs/raft_implementation_review.md

Lines changed: 93 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,93 @@
1+
# Pika Raft 模式实现 Review 文档
2+
3+
## 1. 概述
4+
5+
Pika 的 Raft 模式基于 [braft](https://github.com/baidu/braft) 实现分布式一致性,使用 brpc 进行节点间通信。
6+
7+
**核心特性**
8+
- 强一致性保证
9+
- 自动 Leader 选举
10+
- 基于 RocksDB Checkpoint 的快照机制
11+
12+
## 2. 架构概览
13+
14+
```
15+
┌─────────────────────────────────────────────────────┐
16+
│ Pika Server │
17+
├─────────────────────────────────────────────────────┤
18+
│ Client Request → RaftManager → PikaRaftNode │
19+
│ ↓ │
20+
│ braft::Node │
21+
│ ↓ │
22+
│ PikaStateMachine │
23+
│ ↓ │
24+
│ Storage::OnBinlogWrite() │
25+
│ ↓ │
26+
│ RocksDB │
27+
└─────────────────────────────────────────────────────┘
28+
```
29+
30+
## 3. 核心组件
31+
32+
| 组件 | 文件 | 职责 |
33+
|------|------|------|
34+
| `RaftManager` | [praft.h](../src/praft/include/praft/praft.h) | 管理多个 Raft 节点(每个 DB 一个) |
35+
| `PikaRaftNode` | [praft.h](../src/praft/include/praft/praft.h) | 封装 braft::Node,提供日志追加接口 |
36+
| `PikaStateMachine` | [praft.cc](../src/praft/src/praft.cc) | 实现状态机,处理日志应用和快照 |
37+
| `PPosixFileSystemAdaptor` | [psnapshot.cc](../src/praft/src/psnapshot.cc) | 快照文件系统适配器 |
38+
39+
## 4. 数据流
40+
41+
### 写入流程
42+
1. 客户端发送写命令
43+
2. Storage 层构建 Binlog(Protobuf 格式)
44+
3. 通过 `PikaRaftNode::AppendLog()` 提交到 Raft
45+
4. braft 复制日志到多数节点
46+
5. 提交后 `PikaStateMachine::on_apply()` 被调用
47+
6. 调用 `Storage::OnBinlogWrite()` 写入 RocksDB
48+
49+
### Binlog 格式
50+
51+
定义在 [binlog.proto](../src/praft/src/binlog.proto)
52+
- 支持数据类型:Strings, Hashes, Lists, Sets, ZSets, Streams
53+
- 操作类型:Put, Delete
54+
55+
## 5. 快照机制
56+
57+
- 使用 RocksDB Checkpoint 创建快照
58+
- 快照恢复点基于 `GetSmallestFlushedLogIndex()`
59+
- 通过 `LogIndexOfColumnFamilies` 追踪各 CF 的日志应用进度
60+
61+
## 6. 配置选项
62+
63+
| 配置项 | 默认值 | 说明 |
64+
|--------|--------|------|
65+
| `raft_enabled` | false | 是否启用 Raft |
66+
| `raft_group_id` | "" | Raft Group ID |
67+
| `raft_election_timeout_ms` | 1000 | 选举超时(ms) |
68+
| `raft_snapshot_interval_s` | 3600 | 快照间隔(s) |
69+
70+
## 7. Review 重点
71+
72+
### 正确性
73+
- **日志幂等性**: `IsApplied()` 检查是否已应用,防止重复应用
74+
- **快照一致性**: 使用最小 flushed_log_index 确定快照点
75+
- **WAL 禁用**: Raft 日志提供持久性保证,RocksDB WAL 被禁用
76+
77+
### 性能
78+
- 同步写入等待 Raft 提交(可优化为批量提交)
79+
- Binlog 使用 Protobuf 序列化
80+
81+
### 线程安全
82+
- `LogIndexOfColumnFamilies` 使用 mutex 保护
83+
- braft 保证 `on_apply()` 顺序调用
84+
85+
## 8. 关键代码位置
86+
87+
| 功能 | 文件 |
88+
|------|------|
89+
| 日志应用 | [praft.cc](../src/praft/src/praft.cc) - `on_apply()` |
90+
| Binlog 处理 | [storage.cc](../src/storage/src/storage.cc) - `OnBinlogWrite()` |
91+
| Log Index 追踪 | [log_index.cc](../src/storage/src/log_index.cc) |
92+
| 快照创建 | [psnapshot.cc](../src/praft/src/psnapshot.cc) |
93+
| Raft 命令 | [pika_raft.cc](../src/pika_raft.cc) |

include/pika_db.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -94,6 +94,8 @@ class DB : public std::enable_shared_from_this<DB>, public pstd::noncopyable {
9494
std::shared_ptr<storage::Storage> storage() const;
9595
void GetBgSaveMetaData(std::vector<std::string>* fileNames, std::string* snapshot_uuid);
9696
void BgSaveDB();
97+
pstd::Status CreateCheckpoint(const std::string& checkpoint_dir);
98+
pstd::Status LoadDBFromCheckpoint(const std::string& checkpoint_dir);
9799
void SetBinlogIoError();
98100
void SetBinlogIoErrorrelieve();
99101
bool IsBinlogIoError();

include/pika_server.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,8 @@ enum TaskType {
7171
kCompactRangeSets,
7272
kCompactRangeZSets,
7373
kCompactRangeList,
74+
kLoadDBFromCheckpoint,
75+
kCreateCheckpoint,
7476
};
7577

7678
struct TaskArg {

src/pika_db.cc

Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -67,6 +67,75 @@ void DB::BgSaveDB() {
6767
g_pika_server->BGSaveTaskSchedule(&DoBgSave, static_cast<void*>(bg_task_arg));
6868
}
6969

70+
// Creates a checkpoint of this DB under `<checkpoint_dir>/<db_name_>`.
//
// The target directory is created when it does not exist yet. The checkpoint
// itself is produced by the tasks returned from Storage::CreateCheckpoint();
// every task is waited on before this function returns, and the first failure
// (if any) is the one reported.
//
// @param checkpoint_dir  Parent directory of the checkpoint; a trailing '/' is
//                        optional.
// @return OK on success; IOError when the checkpoint directory cannot be
//         created; Corruption when the DB currently has no storage instance or
//         when a checkpoint task fails.
pstd::Status DB::CreateCheckpoint(const std::string& checkpoint_dir) {
  std::string checkpoint_sub_path = checkpoint_dir;
  if (!checkpoint_sub_path.empty() && checkpoint_sub_path.back() != '/') {
    checkpoint_sub_path.push_back('/');
  }
  checkpoint_sub_path += db_name_;

  if (!pstd::FileExists(checkpoint_sub_path) && pstd::CreatePath(checkpoint_sub_path, 0755) != 0) {
    return Status::IOError("Failed to create checkpoint path", checkpoint_sub_path);
  }

  std::shared_lock guard(dbs_rw_);

  // LoadDBFromCheckpoint() resets storage_ and returns when it fails, so the
  // pointer can legitimately be empty here; fail cleanly instead of
  // dereferencing a null shared_ptr.
  if (!storage_) {
    return Status::Corruption("Create checkpoint failed: storage is not open");
  }

  auto tasks = storage_->CreateCheckpoint(checkpoint_sub_path);

  // Wait for every task before returning so that none of them is still running
  // once dbs_rw_ is released; only the first error is kept for the caller.
  bool failed = false;
  std::string first_error;
  for (auto& task : tasks) {
    auto status = task.get();
    if (!status.ok() && !failed) {
      failed = true;
      first_error = status.ToString();
    }
  }

  if (failed) {
    return Status::Corruption("Create checkpoint failed: " + first_error);
  }
  return Status::OK();
}
93+
94+
// Replaces the DB's storage with the contents of the checkpoint found at
// `<checkpoint_dir>/<db_name_>`.
//
// Under an exclusive lock on dbs_rw_ the current storage is closed, a fresh
// Storage instance loads the checkpoint into db_path_, and the instance is then
// opened with the server's storage options. When Raft is not enabled,
// DisableWal(false) is called on the new storage.
//
// On any failure after the old storage has been closed, the DB is left closed:
// opened_ stays false and storage_ is empty.
//
// @param checkpoint_dir  Parent directory of the checkpoint; a trailing '/' is
//                        optional.
// @return OK on success; NotFound when the checkpoint directory is missing;
//         Corruption when loading the checkpoint or opening the storage fails.
pstd::Status DB::LoadDBFromCheckpoint(const std::string& checkpoint_dir) {
  std::string checkpoint_sub_path = checkpoint_dir;
  if (!checkpoint_sub_path.empty() && checkpoint_sub_path.back() != '/') {
    checkpoint_sub_path.push_back('/');
  }
  checkpoint_sub_path += db_name_;

  if (!pstd::FileExists(checkpoint_sub_path)) {
    return Status::NotFound("Checkpoint dir does not exist: " + checkpoint_sub_path);
  }

  std::lock_guard<std::shared_mutex> guard(dbs_rw_);
  opened_ = false;

  // Detach the current storage from the DB before closing it.
  auto old_storage = storage_;
  storage_.reset();
  if (old_storage) {
    old_storage->Close();
  }

  storage_ = std::make_shared<storage::Storage>();
  auto checkpoint_tasks = storage_->LoadCheckpoint(checkpoint_sub_path, db_path_);

  // Wait for *all* load tasks before acting on a failure: the tasks were
  // started by the new Storage instance, so it must not be released while any
  // of them may still be running. Only the first error is reported.
  bool load_failed = false;
  std::string load_error;
  for (auto& task : checkpoint_tasks) {
    auto status = task.get();
    if (!status.ok() && !load_failed) {
      load_failed = true;
      load_error = status.ToString();
    }
  }
  if (load_failed) {
    storage_.reset();
    return Status::Corruption("Load checkpoint failed: " + load_error);
  }

  storage::StorageOptions storage_options = g_pika_server->storage_options();
  auto open_status = storage_->Open(storage_options, db_path_);
  if (!open_status.ok()) {
    storage_.reset();
    return Status::Corruption("Storage open failed: " + open_status.ToString());
  }

  if (!g_pika_conf->raft_enabled()) {
    storage_->DisableWal(false);
  }

  opened_ = true;
  return Status::OK();
}
138+
70139
void DB::SetBinlogIoError() { return binlog_io_error_.store(true); }
71140
void DB::SetBinlogIoErrorrelieve() { return binlog_io_error_.store(false); }
72141
bool DB::IsBinlogIoError() { return binlog_io_error_.load(); }

src/pika_server.cc

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -497,6 +497,37 @@ Status PikaServer::DoSameThingSpecificDB(const std::set<std::string>& dbs, const
497497
case TaskType::kCompactRangeList:
498498
db_item.second->CompactRange(storage::DataType::kLists, arg.argv[0], arg.argv[1]);
499499
break;
500+
case TaskType::kLoadDBFromCheckpoint: {
501+
// arg.argv[0] should contain checkpoint_path
502+
if (arg.argv.empty()) {
503+
LOG(ERROR) << "LoadDBFromCheckpoint requires checkpoint_path argument";
504+
return Status::InvalidArgument("Missing checkpoint_path");
505+
}
506+
std::string checkpoint_path = arg.argv[0];
507+
auto s = db_item.second->LoadDBFromCheckpoint(checkpoint_path);
508+
if (!s.ok()) {
509+
LOG(ERROR) << "Failed to load DB from checkpoint: " << s.ToString();
510+
return s;
511+
}
512+
LOG(INFO) << "Successfully loaded DB " << db_item.first << " from checkpoint: " << checkpoint_path;
513+
break;
514+
}
515+
case TaskType::kCreateCheckpoint: {
516+
// arg.argv[0] should contain checkpoint_path
517+
if (arg.argv.empty()) {
518+
LOG(ERROR) << "CreateCheckpoint requires checkpoint_path argument";
519+
return Status::InvalidArgument("Missing checkpoint_path");
520+
}
521+
std::string checkpoint_path = arg.argv[0];
522+
auto s = db_item.second->CreateCheckpoint(checkpoint_path);
523+
if (!s.ok()) {
524+
LOG(ERROR) << "Failed to create checkpoint: " << s.ToString();
525+
return s;
526+
}
527+
LOG(INFO) << "Successfully created checkpoint for DB " << db_item.first << " at: " << checkpoint_path;
528+
break;
529+
}
530+
500531
default:
501532
break;
502533
}

src/praft/include/praft/praft.h

Lines changed: 15 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@
1818
#include "braft/raft.h"
1919
#include "braft/storage.h"
2020
#include "braft/util.h"
21+
#include "braft/file_system_adaptor.h"
2122
#include "pstd/include/pstd_mutex.h"
2223
#include "pstd/include/pstd_status.h"
2324
#include "rocksdb/status.h"
@@ -31,6 +32,7 @@ namespace storage {
3132
class Storage;
3233
}
3334

35+
// Forward declarations
3436
namespace pikiwidb {
3537
class Binlog;
3638
}
@@ -74,6 +76,8 @@ class PikaStateMachine : public braft::StateMachine {
7476
PikaStateMachine();
7577
~PikaStateMachine() override = default;
7678

79+
void SetLeaderTerm(std::atomic<int64_t>* leader_term);
80+
7781
// Apply committed log entry
7882
void on_apply(braft::Iterator& iter) override;
7983

@@ -97,7 +101,8 @@ class PikaStateMachine : public braft::StateMachine {
97101
void on_stop_following(const ::braft::LeaderChangeContext& ctx) override;
98102

99103
private:
100-
104+
std::atomic<bool> is_node_first_start_up_{true}; // 标记节点是否首次启动
105+
std::atomic<int64_t>* leader_term_{nullptr};
101106
};
102107

103108
// Raft node wrapper
@@ -130,6 +135,11 @@ class PikaRaftNode {
130135
// Get cluster status information
131136
void GetStatus(std::string* status_str);
132137

138+
void GetLeaderLeaseStatus(braft::LeaderLeaseStatus* status) const;
139+
140+
// Trigger a snapshot creation
141+
pstd::Status DoSnapshot(int64_t self_snapshot_index = 0, bool is_sync = true);
142+
133143
braft::Node* GetRaftNode() { return node_.get(); }
134144

135145
private:
@@ -144,6 +154,10 @@ class PikaRaftNode {
144154
std::string raft_log_uri_;
145155
std::string raft_meta_uri_;
146156
std::string raft_snapshot_uri_;
157+
158+
// Snapshot adaptor
159+
scoped_refptr<braft::FileSystemAdaptor> snapshot_adaptor_;
160+
std::atomic<int64_t> leader_term_{-1};
147161
};
148162

149163
// Raft cluster manager

0 commit comments

Comments
 (0)