1、共28万张表,分布在3000个库中,每个库大约100张表。目前计划拆分成多个changefeed进行处理,但TiCDC卡住不动了,无法进行任何操作,也无法删除当前的changefeed。
2、PD集群部署在k8s中,3副本,配置为4核CPU、8G内存、100G磁盘,磁盘均为SSD。PD最近24小时的监控图如下:
当前pd的leader日志如下:
[2023/02/14 09:00:57.713 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202584] [step=“transfer leader from store 1 to store 5”] [source=create]
[2023/02/14 09:00:57.714 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202584] [from=1] [to=5]
[2023/02/14 09:00:57.715 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202584] [takes=1.684627ms] [operator=“"transfer-hot-read-leader {transfer leader: store 1 to 5} (kind:hot-region,leader, region:1202584(86,17), createAt:2023-02-14 09:00:57.712943653 +0800 CST m=+941027.276799437, startAt:2023-02-14 09:00:57.713414336 +0800 CST m=+941027.277270130, currentStep:1, steps:[transfer leader from store 1 to store 5]) finished"”] [additional-info=]
[2023/02/14 09:00:59.114 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1030033] [operator=“"balance-leader {transfer leader: store 5 to 1} (kind:leader, region:1030033(81,17), createAt:2023-02-14 09:00:59.114682035 +0800 CST m=+941028.678537814, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 1])"”] [additional-info=“{"sourceScore":"236.00","targetScore":"234.00"}”]
[2023/02/14 09:00:59.114 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1030033] [step=“transfer leader from store 5 to store 1”] [source=create]
[2023/02/14 09:00:59.116 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1030033] [from=5] [to=1]
[2023/02/14 09:00:59.116 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1030033] [takes=1.435858ms] [operator=“"balance-leader {transfer leader: store 5 to 1} (kind:leader, region:1030033(81,17), createAt:2023-02-14 09:00:59.114682035 +0800 CST m=+941028.678537814, startAt:2023-02-14 09:00:59.114890233 +0800 CST m=+941028.678746021, currentStep:1, steps:[transfer leader from store 5 to store 1]) finished"”] [additional-info=“{"sourceScore":"236.00","targetScore":"234.00"}”]
[2023/02/14 09:01:37.726 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202596] [operator=“"transfer-hot-read-leader {transfer leader: store 1 to 4} (kind:hot-region,leader, region:1202596(88,17), createAt:2023-02-14 09:01:37.726820516 +0800 CST m=+941067.290676272, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 1 to store 4])"”] [additional-info=]
[2023/02/14 09:01:37.727 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202596] [step=“transfer leader from store 1 to store 4”] [source=create]
[2023/02/14 09:01:37.729 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202596] [from=1] [to=4]
[2023/02/14 09:01:37.729 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202596] [takes=2.227342ms] [operator=“"transfer-hot-read-leader {transfer leader: store 1 to 4} (kind:hot-region,leader, region:1202596(88,17), createAt:2023-02-14 09:01:37.726820516 +0800 CST m=+941067.290676272, startAt:2023-02-14 09:01:37.727068308 +0800 CST m=+941067.290924071, currentStep:1, steps:[transfer leader from store 1 to store 4]) finished"”] [additional-info=]
[2023/02/14 09:01:42.193 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1201876] [operator=“"balance-leader {transfer leader: store 5 to 1} (kind:leader, region:1201876(107,17), createAt:2023-02-14 09:01:42.193314649 +0800 CST m=+941071.757170398, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 1])"”] [additional-info=“{"sourceScore":"235.00","targetScore":"234.00"}”]
[2023/02/14 09:01:42.193 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1201876] [step=“transfer leader from store 5 to store 1”] [source=create]
[2023/02/14 09:01:42.194 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1201876] [from=5] [to=1]
[2023/02/14 09:01:42.195 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1201876] [takes=1.671202ms] [operator=“"balance-leader {transfer leader: store 5 to 1} (kind:leader, region:1201876(107,17), createAt:2023-02-14 09:01:42.193314649 +0800 CST m=+941071.757170398, startAt:2023-02-14 09:01:42.193461837 +0800 CST m=+941071.757317621, currentStep:1, steps:[transfer leader from store 5 to store 1]) finished"”] [additional-info=“{"sourceScore":"235.00","targetScore":"234.00"}”]
[2023/02/14 09:01:54.413 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202580] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202580(87,17), createAt:2023-02-14 09:01:54.413581571 +0800 CST m=+941083.977437355, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 1])"”] [additional-info=]
[2023/02/14 09:01:54.414 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202580] [step=“transfer leader from store 5 to store 1”] [source=create]
[2023/02/14 09:01:54.415 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202580] [from=5] [to=1]
[2023/02/14 09:01:54.415 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202580] [takes=1.654517ms] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202580(87,17), createAt:2023-02-14 09:01:54.413581571 +0800 CST m=+941083.977437355, startAt:2023-02-14 09:01:54.414144201 +0800 CST m=+941083.977999990, currentStep:1, steps:[transfer leader from store 5 to store 1]) finished"”] [additional-info=]
[2023/02/14 09:01:55.714 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202620] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202620(88,17), createAt:2023-02-14 09:01:55.714092001 +0800 CST m=+941085.277947783, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 4])"”] [additional-info=]
[2023/02/14 09:01:55.714 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202620] [step=“transfer leader from store 5 to store 4”] [source=create]
[2023/02/14 09:01:55.716 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202620] [from=5] [to=4]
[2023/02/14 09:01:55.716 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202620] [takes=2.082143ms] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202620(88,17), createAt:2023-02-14 09:01:55.714092001 +0800 CST m=+941085.277947783, startAt:2023-02-14 09:01:55.714406114 +0800 CST m=+941085.278261902, currentStep:1, steps:[transfer leader from store 5 to store 4]) finished"”] [additional-info=]
[2023/02/14 09:04:54.814 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202612] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202612(87,17), createAt:2023-02-14 09:04:54.813887497 +0800 CST m=+941264.377743282, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 1])"”] [additional-info=]
[2023/02/14 09:04:54.814 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202612] [step=“transfer leader from store 5 to store 1”] [source=create]
[2023/02/14 09:04:54.815 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202612] [from=5] [to=1]
[2023/02/14 09:04:54.816 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202612] [takes=1.80506ms] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202612(87,17), createAt:2023-02-14 09:04:54.813887497 +0800 CST m=+941264.377743282, startAt:2023-02-14 09:04:54.814324868 +0800 CST m=+941264.378180654, currentStep:1, steps:[transfer leader from store 5 to store 1]) finished"”] [additional-info=]
[2023/02/14 09:04:56.114 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202624] [operator=“"transfer-hot-read-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202624(88,17), createAt:2023-02-14 09:04:56.114255348 +0800 CST m=+941265.678111133, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 4])"”] [additional-info=]
[2023/02/14 09:04:56.114 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202624] [step=“transfer leader from store 5 to store 4”] [source=create]
[2023/02/14 09:04:56.116 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202624] [from=5] [to=4]
[2023/02/14 09:04:56.116 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202624] [takes=2.007555ms] [operator=“"transfer-hot-read-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202624(88,17), createAt:2023-02-14 09:04:56.114255348 +0800 CST m=+941265.678111133, startAt:2023-02-14 09:04:56.114821758 +0800 CST m=+941265.678677547, currentStep:1, steps:[transfer leader from store 5 to store 4]) finished"”] [additional-info=]
[2023/02/14 09:07:55.136 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202576] [operator=“"transfer-hot-read-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202576(88,17), createAt:2023-02-14 09:07:55.13624988 +0800 CST m=+941444.700105662, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 4])"”] [additional-info=]
[2023/02/14 09:07:55.136 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202576] [step=“transfer leader from store 5 to store 4”] [source=create]
[2023/02/14 09:07:55.138 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202576] [from=5] [to=4]
[2023/02/14 09:07:55.139 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202576] [takes=2.390309ms] [operator=“"transfer-hot-read-leader {transfer leader: store 5 to 4} (kind:hot-region,leader, region:1202576(88,17), createAt:2023-02-14 09:07:55.13624988 +0800 CST m=+941444.700105662, startAt:2023-02-14 09:07:55.136876198 +0800 CST m=+941444.700731999, currentStep:1, steps:[transfer leader from store 5 to store 4]) finished"”] [additional-info=]
[2023/02/14 09:07:56.515 +08:00] [INFO] [operator_controller.go:437] [“add operator”] [region-id=1202564] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202564(87,17), createAt:2023-02-14 09:07:56.514716191 +0800 CST m=+941446.078571973, startAt:0001-01-01 00:00:00 +0000 UTC, currentStep:0, steps:[transfer leader from store 5 to store 1])"”] [additional-info=]
[2023/02/14 09:07:56.515 +08:00] [INFO] [operator_controller.go:635] [“send schedule command”] [region-id=1202564] [step=“transfer leader from store 5 to store 1”] [source=create]
[2023/02/14 09:07:56.517 +08:00] [INFO] [region.go:543] [“leader changed”] [region-id=1202564] [from=5] [to=1]
[2023/02/14 09:07:56.517 +08:00] [INFO] [operator_controller.go:552] [“operator finish”] [region-id=1202564] [takes=1.917522ms] [operator=“"transfer-hot-write-leader {transfer leader: store 5 to 1} (kind:hot-region,leader, region:1202564(87,17), createAt:2023-02-14 09:07:56.514716191 +0800 CST m=+941446.078571973, startAt:2023-02-14 09:07:56.515752957 +0800 CST m=+941446.079608752, currentStep:1, steps:[transfer leader from store 5 to store 1]) finished"”] [additional-info=]
[2023/02/14 09:15:10.515 +08:00] [INFO] [trace.go:145] [“trace[1611567014] put”] [detail=“{key:/tidb/server/minstartts/fc5f7000-6d43-4523-8270-905245b1c2c2; req_size:92; response_revision:7487222; }”] [duration=102.369641ms] [start=2023/02/14 09:15:10.413 +08:00] [end=2023/02/14 09:15:10.515 +08:00] [steps=“["trace[1611567014] ‘process raft request’ (duration: 102.007675ms)"]”]
[2023/02/14 09:15:10.714 +08:00] [WARN] [util.go:144] [“apply request took too long”] [took=102.086683ms] [expected-duration=100ms] [prefix=] [request=“header:<ID:6749072942850525650 > txn:<compare:<target:VALUE key:"/pd/7194634827558957893/leader" value_size:180 > success:<request_put:<key:"/pd/7194634827558957893/timestamp" value_size:8 >> failure:<>>”] [response=size:20] []
[2023/02/14 09:15:10.714 +08:00] [WARN] [tso.go:314] [“clock offset”] [jet-lag=202.134206ms] [prev-physical=2023/02/14 09:15:10.512 +08:00] [now=2023/02/14 09:15:10.714 +08:00] [update-physical-interval=50ms]
[2023/02/14 09:16:12.714 +08:00] [WARN] [stat_persist.go:20] [trace] [elapsed=196.816581ms] [rows=1] [sql=“INSERT INTO keyviz_axis
(layer_num
,time
,axis
) VALUES (0,"2023-02-14 09:16:12.513","")”]
[2023/02/14 09:29:38.015 +08:00] [WARN] [tso.go:314] [“clock offset”] [jet-lag=203.701776ms] [prev-physical=2023/02/14 09:29:37.811 +08:00] [now=2023/02/14 09:29:38.015 +08:00] [update-physical-interval=50ms]
[2023/02/14 09:37:21.249 +08:00] [INFO] [periodic.go:135] [“starting auto periodic compaction”] [revision=7485358] [compact-period=1h0m0s]
[2023/02/14 09:37:21.250 +08:00] [INFO] [index.go:189] [“compact tree index”] [revision=7485358]
[2023/02/14 09:37:21.250 +08:00] [INFO] [periodic.go:146] [“completed auto periodic compaction”] [revision=7485358] [compact-period=1h0m0s] [took=1h0m0.00881159s]
[2023/02/14 09:37:21.280 +08:00] [INFO] [kvstore_compaction.go:55] [“finished scheduled compaction”] [compact-revision=7485358] [took=29.434239ms]
[2023/02/14 09:44:08.512 +08:00] [WARN] [tso.go:314] [“clock offset”] [jet-lag=194.761498ms] [prev-physical=2023/02/14 09:44:08.317 +08:00] [now=2023/02/14 09:44:08.512 +08:00] [update-physical-interval=50ms]
[2023/02/14 09:45:10.111 +08:00] [WARN] [tso.go:314] [“clock offset”] [jet-lag=195.61578ms] [prev-physical=2023/02/14 09:45:09.916 +08:00] [now=2023/02/14 09:45:10.111 +08:00] [update-physical-interval=50ms]
[2023/02/14 09:45:10.512 +08:00] [INFO] [trace.go:145] [“trace[1405525310] put”] [detail=“{key:/tidb/server/minstartts/fc5f7000-6d43-4523-8270-905245b1c2c2; req_size:92; response_revision:7488498; }”] [duration=100.270714ms] [start=2023/02/14 09:45:10.412 +08:00] [end=2023/02/14 09:45:10.512 +08:00] [steps=“["trace[1405525310] ‘process raft request’ (duration: 99.569087ms)"]”]
[2023/02/14 09:48:16.612 +08:00] [WARN] [tso.go:314] [“clock offset”] [jet-lag=196.066851ms] [prev-physical=2023/02/14 09:48:16.415 +08:00] [now=2023/02/14 09:48:16.612 +08:00] [update-physical-interval=50ms]