1、TiKV2 已损坏,是在使用 BR 恢复数据时被打挂的,目前还没有找到恢复方法。
2、TiKV4 是通过扩容 TiKV 的方式启动的。之后缩容 TiKV2 时,TiKV4 上只有非常少量的数据,数据和 leader 都没有迁移到 TiKV4:查看后发现它的数据量只有 100G 左右,而其他 TiKV 节点都在 1.5T 左右。目前通过强制 tombstone 的方式处理,TiKV4 已经恢复。
3、集群状态
4、pd中的内容
member
{
"header": {
"cluster_id": 6820705896630752929
},
"members": [
{
"name": "pd-10.204.9.133-2379",
"member_id": 1758101190664893197,
"peer_urls": [
"http://10.204.9.133:2380"
],
"client_urls": [
"http://10.204.9.133:2379"
],
"deploy_path": "/data/tidb-deploy/pd-2379/bin",
"binary_version": "v4.0.0",
"git_hash": "56d4c3d2237f5bf6fb11a794731ed1d95c8020c2"
},
{
"name": "pd-10.204.9.132-2379",
"member_id": 4003923670935905986,
"peer_urls": [
"http://10.204.9.132:2380"
],
"client_urls": [
"http://10.204.9.132:2379"
],
"deploy_path": "/data/tidb-deploy/pd-2379/bin",
"binary_version": "v4.0.0",
"git_hash": "56d4c3d2237f5bf6fb11a794731ed1d95c8020c2"
},
{
"name": "pd-10.204.9.131-2379",
"member_id": 7629576249764497491,
"peer_urls": [
"http://10.204.9.131:2380"
],
"client_urls": [
"http://10.204.9.131:2379"
],
"deploy_path": "/data/tidb-deploy/pd-2379/bin",
"binary_version": "v4.0.0",
"git_hash": "56d4c3d2237f5bf6fb11a794731ed1d95c8020c2"
}
],
"leader": {
"name": "pd-10.204.9.131-2379",
"member_id": 7629576249764497491,
"peer_urls": [
"http://10.204.9.131:2380"
],
"client_urls": [
"http://10.204.9.131:2379"
]
},
"etcd_leader": {
"name": "pd-10.204.9.131-2379",
"member_id": 7629576249764497491,
"peer_urls": [
"http://10.204.9.131:2380"
],
"client_urls": [
"http://10.204.9.131:2379"
],
"deploy_path": "/data/tidb-deploy/pd-2379/bin",
"binary_version": "v4.0.0",
"git_hash": "56d4c3d2237f5bf6fb11a794731ed1d95c8020c2"
}
}
store
{
"count": 4,
"stores": [
{
"store": {
"id": 1,
"address": "10.204.9.87:20160",
"labels": [
{
"key": "host",
"value": "tikv3"
}
],
"version": "4.0.0",
"status_address": "10.204.9.87:20180",
"git_hash": "198a2cea01734ce8f46d55a29708f123f9133944",
"start_timestamp": 1590896656,
"deploy_path": "/data31/tidb-deploy/tikv-20160/bin/tikv-server",
"last_heartbeat": 1590982377840924510,
"state_name": "Up"
},
"status": {
"capacity": "2.865TiB",
"available": "971.2GiB",
"used_size": "1.884TiB",
"leader_count": 27460,
"leader_weight": 1,
"leader_score": 27460,
"leader_size": 2174716,
"region_count": 98447,
"region_weight": 1,
"region_score": 7874999,
"region_size": 7874999,
"start_ts": "2020-05-31T11:44:16+08:00",
"last_heartbeat_ts": "2020-06-01T11:32:57.84092451+08:00",
"uptime": "23h48m41.84092451s"
}
},
{
"store": {
"id": 6,
"address": "10.204.9.85:20160",
"labels": [
{
"key": "host",
"value": "tikv1"
}
],
"version": "4.0.0",
"status_address": "10.204.9.85:20180",
"git_hash": "198a2cea01734ce8f46d55a29708f123f9133944",
"start_timestamp": 1590896364,
"deploy_path": "/data31/tidb-deploy/tikv-20160/bin/tikv-server",
"last_heartbeat": 1590982373980992964,
"state_name": "Up"
},
"status": {
"capacity": "2.865TiB",
"available": "989GiB",
"used_size": "1.878TiB",
"leader_count": 53012,
"leader_weight": 1,
"leader_score": 53012,
"leader_size": 4145438,
"region_count": 98447,
"region_weight": 1,
"region_score": 7874999,
"region_size": 7874999,
"start_ts": "2020-05-31T11:39:24+08:00",
"last_heartbeat_ts": "2020-06-01T11:32:53.980992964+08:00",
"uptime": "23h53m29.980992964s"
}
},
{
"store": {
"id": 88,
"address": "10.204.9.90:3930",
"labels": [
{
"key": "engine",
"value": "tiflash"
}
],
"version": "v4.0.0",
"peer_address": "10.204.9.90:20170",
"status_address": "10.204.9.90:20292",
"git_hash": "c51c2c5c18860aaef3b5853f24f8e9cefea167eb",
"start_timestamp": 1590896875,
"last_heartbeat": 1590982377140013325,
"state_name": "Up"
},
"status": {
"capacity": "2.865TiB",
"available": "2.715TiB",
"used_size": "277KiB",
"leader_count": 0,
"leader_weight": 1,
"leader_score": 0,
"leader_size": 0,
"region_count": 0,
"region_weight": 1,
"region_score": 0,
"region_size": 0,
"start_ts": "2020-05-31T11:47:55+08:00",
"last_heartbeat_ts": "2020-06-01T11:32:57.140013325+08:00",
"uptime": "23h45m2.140013325s"
}
},
{
"store": {
"id": 657369,
"address": "10.204.9.90:20161",
"version": "4.0.0",
"status_address": "10.204.9.90:20181",
"git_hash": "198a2cea01734ce8f46d55a29708f123f9133944",
"start_timestamp": 1590896859,
"deploy_path": "/data32/deploy/install/deploy/tikv-20161/bin",
"last_heartbeat": 1590982374154880239,
"state_name": "Up"
},
"status": {
"capacity": "2.865TiB",
"available": "1015GiB",
"used_size": "1.866TiB",
"leader_count": 17975,
"leader_weight": 1,
"leader_score": 17975,
"leader_size": 1554845,
"region_count": 92052,
"region_weight": 1,
"region_score": 7348629,
"region_size": 7348629,
"start_ts": "2020-05-31T11:47:39+08:00",
"last_heartbeat_ts": "2020-06-01T11:32:54.154880239+08:00",
"uptime": "23h45m15.154880239s"
}
}
]
}
最后我准备重建整个集群,这边磁盘都快被打满了:原本 1.5T 的数据,现在整体占用变成了 6T,磁盘使用率已经快到 70% 了。