| 
      
        2024-09-06
      
      §
     | 
  
    
  | 15:23 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host sretest2001.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 15:22 | 
  <kamila@cumin1002> | 
  START - Cookbook sre.network.configure-switch-interfaces for host wikikube-worker2103 | 
  [production] | 
            
  | 15:22 | 
  <kamila@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 15:22 | 
  <kamila@cumin1002> | 
  END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2430 to wikikube-worker2103 - kamila@cumin1002" | 
  [production] | 
            
  | 15:19 | 
  <kamila@cumin1002> | 
  START - Cookbook sre.puppet.sync-netbox-hiera generate netbox hiera data: "Triggered by cookbooks.sre.dns.netbox: Renaming mw2430 to wikikube-worker2103 - kamila@cumin1002" | 
  [production] | 
            
  | 15:16 | 
  <kamila@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 15:15 | 
  <kamila@cumin1002> | 
  START - Cookbook sre.hosts.rename from mw2430 to wikikube-worker2103 | 
  [production] | 
            
  | 15:14 | 
  <topranks> | 
  disabling PyBal on lvs1017 to shift traffic to lvs1020 and allow work to fix faulty fibre link T374247 | 
  [production] | 
            
  | 15:13 | 
  <cmooney@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on lvs1017.eqiad.wmnet with reason: Move traffic off lvs1017 to lvs1020 to troubleshooot faulty link | 
  [production] | 
            
  | 15:13 | 
  <cmooney@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on lvs1017.eqiad.wmnet with reason: Move traffic off lvs1017 to lvs1020 to troubleshooot faulty link | 
  [production] | 
            
  | 15:07 | 
  <kamila@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host mw2430.codfw.wmnet | 
  [production] | 
            
  | 15:07 | 
  <kamila@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node depool for host mw2430.codfw.wmnet | 
  [production] | 
            
  | 15:02 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.renumber-node (exit_code=0) Renumbering for host wikikube-worker2098.codfw.wmnet | 
  [production] | 
            
  | 15:02 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2098.codfw.wmnet | 
  [production] | 
            
  | 15:02 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2098.codfw.wmnet | 
  [production] | 
            
  | 14:52 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2098.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 14:51 | 
  <btullis@cumin1002> | 
  END (PASS) - Cookbook sre.wikireplicas.add-wiki (exit_code=0) for database bdrwiki (T371759) | 
  [production] | 
            
  | 14:44 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2095.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 14:42 | 
  <hnowlan@cumin1002> | 
  END (FAIL) - Cookbook sre.k8s.renumber-node (exit_code=99) Renumbering for host wikikube-worker2095.codfw.wmnet | 
  [production] | 
            
  | 14:42 | 
  <hnowlan@cumin1002> | 
  END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host wikikube-worker2095.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 14:42 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2095.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 14:42 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.renumber-node Renumbering for host wikikube-worker2095.codfw.wmnet | 
  [production] | 
            
  | 14:41 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubestage2001.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 14:28 | 
  <akosiaris> | 
  repool kubernetes1059 T365993 | 
  [production] | 
            
  | 14:28 | 
  <akosiaris@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host kubernetes1059.eqiad.wmnet | 
  [production] | 
            
  | 14:27 | 
  <akosiaris@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host kubernetes1059.eqiad.wmnet | 
  [production] | 
            
  | 14:25 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.wikireplicas.add-wiki for database bdrwiki (T371759) | 
  [production] | 
            
  | 14:23 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on kubestage2001.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 14:20 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on kubestage2001.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 14:17 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.renumber-node (exit_code=0) Renumbering for host wikikube-worker2102.codfw.wmnet | 
  [production] | 
            
  | 14:17 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2102.codfw.wmnet | 
  [production] | 
            
  | 14:17 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2102.codfw.wmnet | 
  [production] | 
            
  | 14:13 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2102.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 14:10 | 
  <akosiaris> | 
  restart pybal on lvs1019 | 
  [production] | 
            
  | 14:07 | 
  <akosiaris> | 
  silence alerts based on alertname=PHPFPMTooBusy,deployment=mw-wikifunctions,site=codfw T374241 | 
  [production] | 
            
  | 13:59 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host kubestage2001.codfw.wmnet with OS bookworm | 
  [production] | 
            
  | 13:58 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host kubestage2001.codfw.wmnet | 
  [production] | 
            
  | 13:58 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node depool for host kubestage2001.codfw.wmnet | 
  [production] | 
            
  | 13:56 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.renumber-node (exit_code=0) Renumbering for host kubestage2001.codfw.wmnet | 
  [production] | 
            
  | 13:56 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host kubestage2001.codfw.wmnet | 
  [production] | 
            
  | 13:56 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host kubestage2001.codfw.wmnet | 
  [production] | 
            
  | 13:52 | 
  <btullis@cumin1002> | 
  END (FAIL) - Cookbook sre.wikireplicas.add-wiki (exit_code=99) for database bdrwiki (T371759) | 
  [production] | 
            
  | 13:52 | 
  <jayme> | 
  homer lsw1-a6-codfw* commit 'T372878' | 
  [production] | 
            
  | 13:51 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.wikireplicas.add-wiki for database bdrwiki (T371759) | 
  [production] | 
            
  | 13:48 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2102.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 13:46 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host ganeti-test2003.codfw.wmnet | 
  [production] | 
            
  | 13:44 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on wikikube-worker2102.codfw.wmnet with reason: host reimage | 
  [production] | 
            
  | 13:36 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host kubestage2001.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 13:32 | 
  <cgoubert@cumin1002> | 
  END (FAIL) - Cookbook sre.k8s.renumber-node (exit_code=1) Renumbering for host wikikube-worker2101.codfw.wmnet | 
  [production] | 
            
  | 13:32 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2101.codfw.wmnet | 
  [production] |