| 
      
        2024-09-05
      
      §
     | 
  
    
  | 11:29 | 
  <jayme@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 11:29 | 
  <jayme@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/eventgate-analytics-external: apply | 
  [production] | 
            
  | 11:29 | 
  <jayme@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/eventgate-analytics-external: apply | 
  [production] | 
            
  | 11:28 | 
  <jayme@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 11:28 | 
  <ladsgroup@cumin2002> | 
  dbctl commit (dc=all): 'Promote db2214 to s6 primary T374087', diff saved to https://phabricator.wikimedia.org/P68689 and previous config saved to /var/cache/conftool/dbconfig/20240905-112846-ladsgroup.json | 
  [production] | 
            
  | 11:28 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.reboot-single for host etherpad2002.codfw.wmnet | 
  [production] | 
            
  | 11:28 | 
  <jayme@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 11:27 | 
  <Amir1> | 
  Starting s6 codfw failover from db2129 to db2214 - T374087 | 
  [production] | 
            
  | 11:27 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.hosts.move-vlan for host wikikube-worker2029 | 
  [production] | 
            
  | 11:26 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host wikikube-worker2029.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 11:26 | 
  <jayme@deploy1003> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 11:25 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) depool for host wikikube-worker2029.codfw.wmnet | 
  [production] | 
            
  | 11:25 | 
  <jayme@deploy1003> | 
  helmfile [staging] START helmfile.d/services/eventgate-logging-external: apply | 
  [production] | 
            
  | 11:25 | 
  <jayme@deploy1003> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-analytics-external: apply | 
  [production] | 
            
  | 11:25 | 
  <jayme@deploy1003> | 
  helmfile [staging] START helmfile.d/services/eventgate-analytics-external: apply | 
  [production] | 
            
  | 11:25 | 
  <jayme@deploy1003> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 11:25 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node depool for host wikikube-worker2029.codfw.wmnet | 
  [production] | 
            
  | 11:25 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.k8s.renumber-node Renumbering for host wikikube-worker2029.codfw.wmnet | 
  [production] | 
            
  | 11:24 | 
  <jayme@deploy1003> | 
  helmfile [staging] START helmfile.d/services/eventgate-analytics: apply | 
  [production] | 
            
  | 11:23 | 
  <jayme@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/eventgate-main: apply | 
  [production] | 
            
  | 11:23 | 
  <jayme@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/eventgate-main: apply | 
  [production] | 
            
  | 11:22 | 
  <jayme@deploy1003> | 
  helmfile [staging] DONE helmfile.d/services/eventgate-main: apply | 
  [production] | 
            
  | 11:22 | 
  <jayme@deploy1003> | 
  helmfile [staging] START helmfile.d/services/eventgate-main: apply | 
  [production] | 
            
  | 11:22 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.renumber-node (exit_code=0) Renumbering for host wikikube-worker2090.codfw.wmnet | 
  [production] | 
            
  | 11:22 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2090.codfw.wmnet | 
  [production] | 
            
  | 11:22 | 
  <jayme@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2090.codfw.wmnet | 
  [production] | 
            
  | 11:21 | 
  <jayme> | 
  homer cr*codfw* commit 'T372878' | 
  [production] | 
            
  | 11:21 | 
  <ladsgroup@cumin2002> | 
  dbctl commit (dc=all): 'Set db2214 with weight 0 T374087', diff saved to https://phabricator.wikimedia.org/P68688 and previous config saved to /var/cache/conftool/dbconfig/20240905-112121-ladsgroup.json | 
  [production] | 
            
  | 11:20 | 
  <jelto@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reboot-single (exit_code=0) for host etherpad2002.codfw.wmnet | 
  [production] | 
            
  | 11:20 | 
  <ladsgroup@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 1:00:00 on 24 hosts with reason: Primary switchover s6 T374087 | 
  [production] | 
            
  | 11:19 | 
  <ladsgroup@cumin2002> | 
  START - Cookbook sre.hosts.downtime for 1:00:00 on 24 hosts with reason: Primary switchover s6 T374087 | 
  [production] | 
            
  | 11:19 | 
  <jayme@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2090.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 11:19 | 
  <jiji@deploy1003> | 
  helmfile [codfw] DONE helmfile.d/services/mw-mcrouter: apply | 
  [production] | 
            
  | 11:17 | 
  <jelto@cumin1002> | 
  START - Cookbook sre.hosts.reboot-single for host etherpad2002.codfw.wmnet | 
  [production] | 
            
  | 11:09 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.misc-clusters.roll-restart-reboot-eventschemas (exit_code=0) rolling restart_daemons on A:schema-eqiad | 
  [production] | 
            
  | 11:08 | 
  <jmm@cumin2002> | 
  START - Cookbook sre.misc-clusters.roll-restart-reboot-eventschemas rolling restart_daemons on A:schema-eqiad | 
  [production] | 
            
  | 11:05 | 
  <jiji@deploy1003> | 
  helmfile [codfw] START helmfile.d/services/mw-mcrouter: apply | 
  [production] | 
            
  | 11:00 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.renumber-node (exit_code=0) Renumbering for host wikikube-worker2084.codfw.wmnet | 
  [production] | 
            
  | 11:00 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.k8s.pool-depool-node (exit_code=0) pool for host wikikube-worker2084.codfw.wmnet | 
  [production] | 
            
  | 11:00 | 
  <hnowlan@cumin1002> | 
  START - Cookbook sre.k8s.pool-depool-node pool for host wikikube-worker2084.codfw.wmnet | 
  [production] | 
            
  | 10:58 | 
  <hnowlan> | 
  homer lsw1-b3-codfw* commit | 
  [production] | 
            
  | 10:57 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host wikikube-worker2084.codfw.wmnet with OS bullseye | 
  [production] | 
            
  | 10:51 | 
  <sfaci@deploy1003> | 
  helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/mpic-next: apply | 
  [production] | 
            
  | 10:51 | 
  <sfaci@deploy1003> | 
  helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/mpic-next: apply | 
  [production] | 
            
  | 10:50 | 
  <aborrero@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.openstack.tofu (exit_code=0) running tofu plan+apply for main branch | 
  [admin] | 
            
  | 10:49 | 
  <aborrero@cloudcumin1001> | 
  START - Cookbook wmcs.openstack.tofu running tofu plan+apply for main branch | 
  [admin] | 
            
  | 10:43 | 
  <aborrero@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.openstack.tofu (exit_code=0) running tofu plan for https://gitlab.wikimedia.org/repos/cloud/cloud-vps/tofu-infra/-/merge_requests/36 | 
  [admin] | 
            
  | 10:43 | 
  <aborrero@cloudcumin1001> | 
  START - Cookbook wmcs.openstack.tofu running tofu plan for https://gitlab.wikimedia.org/repos/cloud/cloud-vps/tofu-infra/-/merge_requests/36 | 
  [admin] | 
            
  | 10:42 | 
  <vgutierrez@cumin1002> | 
  END (PASS) - Cookbook sre.cdn.roll-upgrade-ats (exit_code=0) Rolling upgrade/restart of Apache Traffic Server on A:cp-text_esams for 9.2.5-1wm2 | 
  [production] | 
            
  | 10:38 | 
  <hnowlan@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on wikikube-worker2084.codfw.wmnet with reason: host reimage | 
  [production] |