2024-11-26
§
|
14:08 |
<brouberol@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-search: apply |
[production] |
14:07 |
<brouberol@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-search: apply |
[production] |
14:05 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on dns7001.wikimedia.org with reason: host reimage |
[production] |
14:05 |
<brouberol@deploy2002> |
helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-search: apply |
[production] |
14:01 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cp7015.magru.wmnet with OS bullseye |
[production] |
14:01 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - fabfur@cumin1002" |
[production] |
14:01 |
<fabfur@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - fabfur@cumin1002" |
[production] |
13:54 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on an-redacteddb1001.eqiad.wmnet with reason: Reclone (T379724) |
[production] |
13:54 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on an-redacteddb1001.eqiad.wmnet with reason: Reclone (T379724) |
[production] |
13:54 |
<ladsgroup@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on clouddb1020.eqiad.wmnet with reason: Reclone (T379724) |
[production] |
13:54 |
<ladsgroup@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on clouddb1020.eqiad.wmnet with reason: Reclone (T379724) |
[production] |
13:49 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host lvs7003.magru.wmnet with OS bullseye |
[production] |
13:49 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - fabfur@cumin1002" |
[production] |
13:49 |
<ladsgroup@cumin1002> |
conftool action : set/pooled=no; selector: name=clouddb1020.eqiad.wmnet,service=s8 |
[production] |
13:46 |
<fabfur@cumin1002> |
START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - fabfur@cumin1002" |
[production] |
13:43 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.reimage for host dns7001.wikimedia.org with OS bullseye |
[production] |
13:40 |
<cmooney@cumin1002> |
END (PASS) - Cookbook sre.hosts.dhcp (exit_code=0) for host dns7001.wikimedia.org |
[production] |
13:38 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on cp7004.magru.wmnet with reason: T376737 |
[production] |
13:38 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on cp7004.magru.wmnet with reason: T376737 |
[production] |
13:35 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cp7015.magru.wmnet with reason: host reimage |
[production] |
13:34 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on cp7010.magru.wmnet with reason: T376737 |
[production] |
13:34 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on cp7010.magru.wmnet with reason: T376737 |
[production] |
13:34 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on cp7003.magru.wmnet with reason: T376737 |
[production] |
13:34 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on cp7003.magru.wmnet with reason: T376737 |
[production] |
13:32 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on cp7015.magru.wmnet with reason: host reimage |
[production] |
13:31 |
<dcaro> |
added cloudcephmon1004 to the ceph mon pool |
[admin] |
13:29 |
<Emperor> |
swift delete wikipedia-commons-local-public.bf b/bf/Schuur_-_Nieuwerbrug_-_20164513_-_RCE.jpg T380738 |
[production] |
13:29 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on cp7003.magru.wmnet with reason: T376737 |
[production] |
13:28 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on cp7003.magru.wmnet with reason: T376737 |
[production] |
13:28 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1 day, 0:00:00 on cp7002.magru.wmnet with reason: T376737 |
[production] |
13:28 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 1 day, 0:00:00 on cp7002.magru.wmnet with reason: T376737 |
[production] |
13:28 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on cp7002.magru.wmnet with reason: T376737 |
[production] |
13:28 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 4:00:00 on cp7002.magru.wmnet with reason: T376737 |
[production] |
13:27 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on cp7008.magru.wmnet with reason: T376737 |
[production] |
13:27 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 4:00:00 on cp7008.magru.wmnet with reason: T376737 |
[production] |
13:27 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on cp7006.magru.wmnet with reason: T376737 |
[production] |
13:26 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 4:00:00 on cp7006.magru.wmnet with reason: T376737 |
[production] |
13:26 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 4:00:00 on cp7001.magru.wmnet with reason: T376737 |
[production] |
13:26 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 4:00:00 on cp7001.magru.wmnet with reason: T376737 |
[production] |
13:21 |
<cmooney@cumin1002> |
START - Cookbook sre.hosts.dhcp for host dns7001.wikimedia.org |
[production] |
13:20 |
<fabfur@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on lvs7003.magru.wmnet with reason: host reimage |
[production] |
13:18 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.downtime for 2:00:00 on lvs7003.magru.wmnet with reason: host reimage |
[production] |
13:15 |
<dcaro@cumin1002> |
END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host cloudcephmon1004.eqiad.wmnet with OS bullseye |
[production] |
13:11 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.reimage for host cp7015.magru.wmnet with OS bullseye |
[production] |
13:11 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'db1246 (re)pooling @ 100%: repool', diff saved to https://phabricator.wikimedia.org/P71185 and previous config saved to /var/cache/conftool/dbconfig/20241126-131120-arnaudb.json |
[production] |
13:07 |
<sukhe@cumin1002> |
END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host dns7001.wikimedia.org with OS bookworm |
[production] |
13:03 |
<sukhe@cumin1002> |
START - Cookbook sre.hosts.reimage for host dns7001.wikimedia.org with OS bookworm |
[production] |
12:58 |
<fabfur@cumin1002> |
START - Cookbook sre.hosts.reimage for host lvs7003.magru.wmnet with OS bullseye |
[production] |
12:57 |
<dcaro@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on cloudcephmon1004.eqiad.wmnet with reason: host reimage |
[production] |
12:56 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'db1246 (re)pooling @ 75%: repool', diff saved to https://phabricator.wikimedia.org/P71183 and previous config saved to /var/cache/conftool/dbconfig/20241126-125614-arnaudb.json |
[production] |