r-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:04.755223 72 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:04.777478 72 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:06.255128 73 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:06.263564 73 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:06.826195 74 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:06.839129 74 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:08.312213 75 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:08.318936 75 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:08.899307 60 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:08.907496 60 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:10.360368 61 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 01:33:10.374974 61 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
INFO
I20220726 01:35:17.236651 125 HBProcessor.cpp:40] Machine "ai-plat-test-nebula-cluster-storaged-2.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779 is not registed
I20220726 01:35:31.367146 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 01:35:35.053288 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:15:11.444511 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:15:31.520273 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:16:26.933535 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:25:13.013173 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:25:36.381052 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:27:00.778218 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:27:06.821228 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:30:37.899597 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:30:41.608166 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:39:22.216208 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:41:33.884649 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:42:44.569519 125 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 02:42:44.571643 125 HBProcessor.cpp:40] Machine "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779 is not registed
I20220726 02:43:12.492338 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:53:14.881646 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:53:23.499811 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 03:00:43.565696 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 03:00:46.803411 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 03:20:04.885737 125 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
在 metad-0 节点内 ping metad-1 的域名是可以 ping 通的：
[root@ai-plat-test-nebula-cluster-metad-0 nebula]# ping ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local
PING ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140) 56(84) bytes of data.
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=1 ttl=62 time=1.71 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=2 ttl=62 time=0.283 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=3 ttl=62 time=0.345 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=4 ttl=62 time=0.361 ms
[root@ai-plat-test-nebula-cluster-metad-1 nebula]# tail -fn 2000 logs/nebula-metad.ERROR
Log file created at: 2022/07/26 02:41:16
Running on machine: ai-plat-test-nebula-cluster-metad-1
Running duration (h:mm:ss): 0:00:00
Log line format: [IWEF]yyyymmdd hh:mm:ss.uuuuuu threadid file:line] msg
E20220726 02:41:16.079069 1 FileUtils.cpp:377] Failed to read the directory "/usr/local/nebula/data/meta/nebula" (2): No such file or directory
INFO
Log file created at: 2022/07/26 02:41:16
Running on machine: ai-plat-test-nebula-cluster-metad-1
Running duration (h:mm:ss): 0:00:00
Log line format: [IWEF]yyyymmdd hh:mm:ss.uuuuuu threadid file:line] msg
I20220726 02:41:16.012902 1 MetaDaemon.cpp:135] localhost = "ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local":9559
I20220726 02:41:16.023653 1 NebulaStore.cpp:51] Start the raft service...
I20220726 02:41:16.025631 1 NebulaSnapshotManager.cpp:25] Send snapshot is rate limited to 10485760 for each part by default
I20220726 02:41:16.074375 1 RaftexService.cpp:46] Start raft service on 9560
I20220726 02:41:16.077728 1 NebulaStore.cpp:85] Scan the local path, and init the spaces_
E20220726 02:41:16.079069 1 FileUtils.cpp:377] Failed to read the directory "/usr/local/nebula/data/meta/nebula" (2): No such file or directory
I20220726 02:41:16.091737 1 NebulaStore.cpp:271] Init data from partManager for "ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local":9559
I20220726 02:41:16.091754 1 NebulaStore.cpp:387] Create data space 0
I20220726 02:41:16.215380 1 RocksEngine.cpp:97] open rocksdb on /usr/local/nebula/data/meta/nebula/0/data
I20220726 02:41:16.236122 1 NebulaStore.cpp:459] Space 0, part 0 has been added, asLearner 0
I20220726 02:41:16.236162 1 NebulaStore.cpp:78] Register handler...
I20220726 02:41:16.236167 1 MetaDaemonInit.cpp:101] Waiting for the leader elected...
I20220726 02:41:16.236172 1 MetaDaemonInit.cpp:113] Leader has not been elected, sleep 1s
I20220726 02:41:16.484977 60 ThriftClientManager-inl.h:67] resolve "ai-plat-test-nebula-cluster-metad-0.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local":9560 as "100.101.40.32":9560
I20220726 02:41:16.488499 60 ThriftClientManager-inl.h:67] resolve "ai-plat-test-nebula-cluster-metad-2.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local":9560 as "100.74.36.214":9560
I20220726 02:41:17.236260 1 MetaDaemonInit.cpp:113] Leader has not been elected, sleep 1s
I20220726 02:41:18.236408 1 KVBasedClusterIdMan.h:109] There is no clusterId existed in kvstore!
I20220726 02:41:18.236443 1 MetaDaemonInit.cpp:129] I am follower, wait for the leader's clusterId
I20220726 02:41:18.236446 1 MetaDaemonInit.cpp:131] Waiting for the leader's clusterId
I20220726 02:41:19.236593 1 KVBasedClusterIdMan.h:109] There is no clusterId existed in kvstore!
I20220726 02:41:19.237990 1 MetaDaemonInit.cpp:131] Waiting for the leader's clusterId
I20220726 02:41:20.238178 1 MetaDaemonInit.cpp:140] Get meta version is 3
I20220726 02:41:20.238209 1 MetaDaemonInit.cpp:157] Nebula store init succeeded, clusterId 5012000189760346409
I20220726 02:41:20.238214 1 MetaDaemon.cpp:148] Start http service
I20220726 02:41:20.238947 1 MetaDaemonInit.cpp:162] Starting Meta HTTP Service
I20220726 02:41:20.241266 99 WebService.cpp:124] Web service started on HTTP[19559]
I20220726 02:41:20.241307 1 JobManager.cpp:69] Not leader, skip reading remaining jobs
I20220726 02:41:20.241415 1 JobManager.cpp:56] JobManager initialized
I20220726 02:41:20.241426 105 JobManager.cpp:119] JobManager::scheduleThread enter
I20220726 02:41:20.244334 1 MetaDaemon.cpp:213] The meta daemon start on "ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local":9559
I20220726 02:43:02.105170 142 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:52:37.946771 142 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 02:55:20.444234 142 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
I20220726 03:20:46.410261 142 ListHostsProcessor.cpp:343] List Hosts Failed, error E_LEADER_CHANGED
r-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:10.823745 64 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:11.591990 65 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:11.603370 66 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:13.645320 67 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:13.648716 68 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:14.370640 69 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:15.725541 71 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:15.729526 70 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:16.751642 72 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:17.748519 74 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:19.660256 75 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
E20220726 02:41:20.378620 61 ThriftClientManager-inl.h:70] Failed to resolve address for 'ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local': Name or service not known (error=-2): Unknown error -2
INFO
I20220726 03:26:14.160804 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-1.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:14.608219 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-2.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:15.162343 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-1.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:15.609239 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-2.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:16.163241 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-1.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:16.610944 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-2.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:19.401046 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:20.403025 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:21.405977 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:22.144124 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-0.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:22.409160 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-1.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:23.158027 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-0.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:23.271517 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-0.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:24.163991 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-0.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:24.276914 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-0.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
I20220726 03:26:25.165108 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-graphd-0.ai-plat-test-nebula-cluster-graphd-svc.stg-ai-platform.svc.cluster.local":9669, role = GRAPH
I20220726 03:26:25.281967 142 HBProcessor.cpp:33] Receive heartbeat from "ai-plat-test-nebula-cluster-storaged-0.ai-plat-test-nebula-cluster-storaged-headless.stg-ai-platform.svc.cluster.local":9779, role = STORAGE
在 metad-2 节点内 ping metad-1 的域名是可以 ping 通的：
[root@ai-plat-test-nebula-cluster-metad-2 nebula]# ping ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local
PING ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140) 56(84) bytes of data.
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=1 ttl=62 time=0.836 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=2 ttl=62 time=0.268 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=3 ttl=62 time=0.391 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=4 ttl=62 time=0.427 ms
64 bytes from ai-plat-test-nebula-cluster-metad-1.ai-plat-test-nebula-cluster-metad-headless.stg-ai-platform.svc.cluster.local (100.87.204.140): icmp_seq=5 ttl=62 time=0.310 ms