| 
      
        2024-09-09
      
      §
     | 
  
    
  | 16:09 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2095.codfw.wmnet | 
  [production] | 
            
  | 16:05 | 
  <hnowlan> | 
  homer lsw1-b5-codfw* commit | 
  [production] | 
            
  | 16:05 | 
  <aqu@deploy1003> | 
  Finished deploy [airflow-dags/analytics_test@5315c8d]: Test Refine through Airflow (duration: 00m 10s) | 
  [production] | 
            
  | 16:04 | 
  <aqu@deploy1003> | 
  Started deploy [airflow-dags/analytics_test@5315c8d]: Test Refine through Airflow | 
  [production] | 
            
  | 16:04 | 
  <claime> | 
  homer lsw1-b6-codfw* commit 'T372878' | 
  [production] | 
            
  | 16:03 | 
  <claime> | 
  homer cr*codfw* commit 'T372878' | 
  [production] | 
            
  | 16:01 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2105.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 15:53 | 
  <cmooney@cumin1002> | 
  END (PASS) - Cookbook sre.deploy.python-code (exit_code=0) homer to cumin2002.codfw.wmnet,cumin1002.eqiad.wmnet with reason: Release v0.7.0 plugin update for cephosd bgp - cmooney@cumin1002 | 
  [production] | 
            
  | 15:48 | 
  <hnowlan@cumin1002> | 
  END (ERROR) - Cookbook sre.k8s.pool-depool-node (exit_code=97) pool for host wikikube-worker2095.codfw.wmnet | 
  [production] | 
            
  | 15:48 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2095.codfw.wmnet | 
  [production] | 
            
  | 15:47 | 
  <cmooney@cumin1002> | 
  START - Cookbook sre.deploy.python-code homer to cumin2002.codfw.wmnet,cumin1002.eqiad.wmnet with reason: Release v0.7.0 plugin update for cephosd bgp - cmooney@cumin1002 | 
  [production] | 
            
  | 15:46 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2095.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 15:45 | 
  <aborrero@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.openstack.tofu (exit_code=0) running tofu plan+apply for main branch | 
  [admin] | 
            
  | 15:44 | 
  <aborrero@cloudcumin1001> | 
  START - Cookbook wmcs.openstack.tofu running tofu plan+apply for main branch | 
  [admin] | 
            
  | 15:44 | 
  <aborrero@cloudcumin1001> | 
  END (FAIL) - Cookbook wmcs.openstack.tofu (exit_code=99) running tofu plan+apply for main branch | 
  [admin] | 
            
  | 15:44 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2106.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:41 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2105.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:41 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2106.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:41 | 
  <elukey@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host sretest2001.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 15:40 | 
  <cmooney@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for asw2-d-eqiad | 
  [production] | 
            
  | 15:40 | 
  <cmooney@cumin1002> | 
  START - Cookbook sre.hosts.remove-downtime for asw2-d-eqiad | 
  [production] | 
            
  | 15:37 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2105.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:37 | 
  <aborrero@cloudcumin1001> | 
  START - Cookbook wmcs.openstack.tofu running tofu plan+apply for main branch | 
  [admin] | 
            
  | 15:32 | 
  <sukhe> | 
  restart bird on durum1001 | 
  [production] | 
            
  | 15:27 | 
  <cmooney@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on asw2-d-eqiad with reason: replace vcp link from d2 port 51 to d4 port 52 | 
  [production] | 
            
  | 15:27 | 
  <cmooney@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 1:00:00 on asw2-d-eqiad with reason: replace vcp link from d2 port 51 to d4 port 52 | 
  [production] | 
            
  | 15:26 | 
  <hnowlan@cumin1002> | 
  END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) for 2:00:00 on wikikube-worker2095.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:26 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2095.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 15:24 | 
  <aborrero@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.openstack.tofu (exit_code=0) running tofu plan for https://gitlab.wikimedia.org/repos/cloud/cloud-vps/tofu-infra/-/merge_requests/39 | 
  [admin] | 
            
  | 15:23 | 
  <aborrero@cloudcumin1001> | 
  START - Cookbook wmcs.openstack.tofu running tofu plan for https://gitlab.wikimedia.org/repos/cloud/cloud-vps/tofu-infra/-/merge_requests/39 | 
  [admin] | 
            
  | 15:09 | 
  <moritzm> | 
  installing imagemagick security updates | 
  [production] | 
            
  | 15:08 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2095.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 15:05 | 
  <dcaro@cloudcumin1001> | 
  START - Cookbook wmcs.ceph.osd.drain_node (T373986) | 
  [admin] | 
            
  | 15:04 | 
  <dcaro@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.ceph.osd.drain_node (exit_code=0) (T373986) | 
  [admin] | 
            
  | 14:55 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.move-vlan (exit_code=0) for host wikikube-worker2106 | 
  [production] | 
            
  | 14:55 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.network.configure-switch-interfaces (exit_code=0) for host wikikube-worker2106 | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2106 | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.dns.wipe-cache (exit_code=0) wikikube-worker2106.codfw.wmnet 57.16.192.10.in-addr.arpa 7.5.0.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.dns.wipe-cache wikikube-worker2106.codfw.wmnet 57.16.192.10.in-addr.arpa 7.5.0.0.6.1.0.0.2.9.1.0.0.1.0.0.2.0.1.0.0.6.8.0.0.0.0.0.0.2.6.2.ip6.arpa on all recursors | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host wikikube-worker2106 - cgoubert@cumin1002" | 
  [production] | 
            
  | 14:54 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Update records for host wikikube-worker2106 - cgoubert@cumin1002" | 
  [production] | 
            
  | 14:53 | 
  <hnowlan@deploy1003> | 
  helmfile [eqiad] DONE helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:53 | 
  <hnowlan@deploy1003> | 
  helmfile [eqiad] START helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:53 | 
  <hnowlan@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:53 | 
  <hnowlan@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:51 | 
  <hnowlan@deploy1003> | 
  helmfile [staging] DONE helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:51 | 
  <ladsgroup@cumin1002> | 
  dbctl commit (dc=all): 'Repooling after maintenance db2140 (T371742)', diff saved to https://phabricator.wikimedia.org/P68759 and previous config saved to /var/cache/conftool/dbconfig/20240909-145145-ladsgroup.json | 
  [production] | 
            
  | 14:51 | 
  <hnowlan@deploy1003> | 
  helmfile [staging] START helmfile.d/services/rest-gateway: apply | 
  [production] | 
            
  | 14:51 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] |