2025-01-15
§
|
13:09 |
<elukey> |
restart wdqs-blazegraph.service on wdqs1013 - failed http probes |
[production] |
13:06 |
<elukey> |
`elukey@puppetmaster1001:~$ sudo puppet cert destroy graphite.discovery.wmnet` |
[production] |
13:05 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db1163 T383689', diff saved to https://phabricator.wikimedia.org/P72073 and previous config saved to /var/cache/conftool/dbconfig/20250115-130511-marostegui.json |
[production] |
13:03 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Promote db1184 to s1 primary T383689', diff saved to https://phabricator.wikimedia.org/P72072 and previous config saved to /var/cache/conftool/dbconfig/20250115-130354-root.json |
[production] |
13:03 |
<jelto@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2368 to wikikube-worker2227 - jelto@cumin1002" |
[production] |
13:03 |
<marostegui> |
Starting s1 eqiad failover from db1163 to db1184 - T383689 |
[production] |
12:59 |
<jelto@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
12:58 |
<jelto@cumin1002> |
START - Cookbook sre.hosts.rename from mw2368 to wikikube-worker2227 |
[production] |
12:58 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Remove db1184 from API T383689', diff saved to https://phabricator.wikimedia.org/P72071 and previous config saved to /var/cache/conftool/dbconfig/20250115-125818-root.json |
[production] |
12:58 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2367 to wikikube-worker2226 |
[production] |
12:57 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on 34 hosts with reason: Primary switchover s1 T383689 |
[production] |
12:57 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2226 |
[production] |
12:57 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Set db1184 with weight 0 T383689', diff saved to https://phabricator.wikimedia.org/P72070 and previous config saved to /var/cache/conftool/dbconfig/20250115-125732-root.json |
[production] |
12:57 |
<jelto@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2226 |
[production] |
12:57 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
12:57 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2367 to wikikube-worker2226 - jelto@cumin1002" |
[production] |
12:57 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 1:00:00 on 34 hosts with reason: Primary switchover s1 T383689 |
[production] |
12:57 |
<jelto@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2367 to wikikube-worker2226 - jelto@cumin1002" |
[production] |
12:53 |
<jelto@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
12:53 |
<jelto@cumin1002> |
START - Cookbook sre.hosts.rename from mw2367 to wikikube-worker2226 |
[production] |
12:52 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2366 to wikikube-worker2225 |
[production] |
12:51 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2225 |
[production] |
12:51 |
<jelto@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2225 |
[production] |
12:51 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
12:51 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2366 to wikikube-worker2225 - jelto@cumin1002" |
[production] |
12:50 |
<jelto@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2366 to wikikube-worker2225 - jelto@cumin1002" |
[production] |
12:46 |
<jelto@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
12:46 |
<jelto@cumin1002> |
START - Cookbook sre.hosts.rename from mw2366 to wikikube-worker2225 |
[production] |
12:45 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.hosts.rename (exit_code=0) from mw2359 to wikikube-worker2224 |
[production] |
12:44 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2224 |
[production] |
12:44 |
<jelto@cumin1002> |
START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2224 |
[production] |
12:44 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.dns.netbox (exit_code=0) |
[production] |
12:44 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2359 to wikikube-worker2224 - jelto@cumin1002" |
[production] |
12:43 |
<jelto@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2359 to wikikube-worker2224 - jelto@cumin1002" |
[production] |
12:40 |
<jelto@cumin1002> |
START - Cookbook sre.dns.netbox |
[production] |
12:39 |
<jelto@cumin1002> |
START - Cookbook sre.hosts.rename from mw2359 to wikikube-worker2224 |
[production] |
12:35 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Remove db2130 from dbctl T383766', diff saved to https://phabricator.wikimedia.org/P72069 and previous config saved to /var/cache/conftool/dbconfig/20250115-123501-marostegui.json |
[production] |
12:30 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host mw[2359,2366-2368].codfw.wmnet |
[production] |
12:28 |
<jelto@cumin1002> |
START - Cookbook sre.k8s.pool-depool-node depool for host mw[2359,2366-2368].codfw.wmnet |
[production] |
12:24 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depool db2130 T374623', diff saved to https://phabricator.wikimedia.org/P72068 and previous config saved to /var/cache/conftool/dbconfig/20250115-122419-marostegui.json |
[production] |
12:10 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on db[2134,2160,2234].codfw.wmnet with reason: maintenance |
[production] |
12:10 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on db[2134,2160,2234].codfw.wmnet with reason: maintenance |
[production] |
12:02 |
<kart_> |
Updated cxserver to 2025-01-15-103159-production (T377966) |
[production] |
11:59 |
<kartik@deploy2002> |
helmfile [eqiad] DONE helmfile.d/services/cxserver: apply |
[production] |
11:59 |
<kartik@deploy2002> |
helmfile [eqiad] START helmfile.d/services/cxserver: apply |
[production] |
11:58 |
<kartik@deploy2002> |
helmfile [codfw] DONE helmfile.d/services/cxserver: apply |
[production] |
11:58 |
<kartik@deploy2002> |
helmfile [codfw] START helmfile.d/services/cxserver: apply |
[production] |
11:56 |
<kartik@deploy2002> |
helmfile [staging] DONE helmfile.d/services/cxserver: apply |
[production] |
11:56 |
<kartik@deploy2002> |
helmfile [staging] START helmfile.d/services/cxserver: apply |
[production] |
11:32 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'es1043 (re)pooling @ 100%: Repooling', diff saved to https://phabricator.wikimedia.org/P72067 and previous config saved to /var/cache/conftool/dbconfig/20250115-113210-root.json |
[production] |