| 
      
        2024-11-18
      
      §
     | 
  
    
  | 13:03 | 
  <jelto@deploy2002> | 
  helmfile [staging] START helmfile.d/services/wikidata-query-gui: apply | 
  [production] | 
            
  | 13:01 | 
  <moritzm> | 
  removing ganeti1021 from active Ganeti nodes T378921 | 
  [production] | 
            
  | 12:56 | 
  <btullis@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on an-presto1018.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 12:54 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2:00:00 on an-presto1018.eqiad.wmnet with reason: host reimage | 
  [production] | 
            
  | 12:39 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host an-presto1018.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 12:38 | 
  <btullis@cumin1002> | 
  END (ERROR) - Cookbook sre.hosts.reimage (exit_code=97) for host an-presto1018.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 12:38 | 
  <cgoubert@cumin1002> | 
  END (PASS) - Cookbook sre.dns.netbox (exit_code=0) | 
  [production] | 
            
  | 12:37 | 
  <kart_> | 
  Updated recommendation api to 2024-11-13-183159-production (T379592, T379037) | 
  [production] | 
            
  | 12:36 | 
  <arnaudb@cumin1002> | 
  START - Cookbook sre.mysql.pool db2150 slowly with 10 steps - slow repool db2150 T380117 | 
  [production] | 
            
  | 12:36 | 
  <cgoubert@cumin1002> | 
  START - Cookbook sre.dns.netbox | 
  [production] | 
            
  | 12:24 | 
  <kartik@deploy2002> | 
  helmfile [ml-serve-codfw] 'sync' command on namespace 'recommendation-api-ng' for release 'main' . | 
  [production] | 
            
  | 12:22 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host an-presto1018.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 12:22 | 
  <kartik@deploy2002> | 
  helmfile [ml-serve-eqiad] 'sync' command on namespace 'recommendation-api-ng' for release 'main' . | 
  [production] | 
            
  | 12:21 | 
  <btullis@cumin1002> | 
  END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host an-presto1018.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 12:19 | 
  <btullis@cumin1002> | 
  END (PASS) - Cookbook sre.druid.roll-restart-workers (exit_code=0) for Druid analytics cluster: Roll restart of Druid jvm daemons. | 
  [production] | 
            
  | 12:15 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/airflow-analytics-product: apply | 
  [production] | 
            
  | 12:14 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-analytics-product: apply | 
  [production] | 
            
  | 12:13 | 
  <fabfur@cumin1002> | 
  END (PASS) - Cookbook sre.cdn.roll-upgrade-haproxy (exit_code=0) rolling upgrade of HAProxy on A:cp-ulsfo | 
  [production] | 
            
  | 12:13 | 
  <kartik@deploy2002> | 
  helmfile [ml-staging-codfw] 'sync' command on namespace 'recommendation-api-ng' for release 'main' . | 
  [production] | 
            
  | 12:10 | 
  <elukey@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 12:09 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] DONE helmfile.d/dse-k8s-services/airflow-analytics-product: apply | 
  [production] | 
            
  | 12:08 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.hosts.reimage for host an-presto1018.eqiad.wmnet with OS bullseye | 
  [production] | 
            
  | 12:02 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] START helmfile.d/dse-k8s-services/airflow-analytics-product: apply | 
  [production] | 
            
  | 12:00 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] DONE helmfile.d/admin 'apply'. | 
  [production] | 
            
  | 11:59 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:59 | 
  <stevemunene@deploy2002> | 
  helmfile [dse-k8s-eqiad] START helmfile.d/admin 'apply'. | 
  [production] | 
            
  | 11:58 | 
  <elukey@cumin2002> | 
  END (PASS) - Cookbook sre.hosts.provision (exit_code=0) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:58 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:47 | 
  <jmm@cumin2002> | 
  END (PASS) - Cookbook sre.ganeti.drain-node (exit_code=0) for draining ganeti node ganeti1021.eqiad.wmnet | 
  [production] | 
            
  | 11:45 | 
  <elukey@cumin1002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:45 | 
  <elukey@cumin1002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:41 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:41 | 
  <arnaudb@cumin1002> | 
  END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2 days, 0:00:00 on db2216.codfw.wmnet with reason: T380131 - table corruption | 
  [production] | 
            
  | 11:41 | 
  <arnaudb@cumin1002> | 
  START - Cookbook sre.hosts.downtime for 2 days, 0:00:00 on db2216.codfw.wmnet with reason: T380131 - table corruption | 
  [production] | 
            
  | 11:41 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be1005.mgmt.eqiad.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:41 | 
  <urbanecm> | 
  mwmaint2002: Run `extensions/GrowthExperiments/maintenance/refreshLinkRecommendations.php` at `testwiki` for a bunch of pages (P71064 is list of commands executed; T378983) | 
  [production] | 
            
  | 11:33 | 
  <btullis@cumin1002> | 
  START - Cookbook sre.druid.roll-restart-workers for Druid analytics cluster: Roll restart of Druid jvm daemons. | 
  [production] | 
            
  | 11:25 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:25 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:21 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:16 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 11:14 | 
  <dcaro@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.toolforge.component.deploy (exit_code=0) for component jobs-emailer | 
  [tools] | 
            
  | 11:09 | 
  <dcaro@cloudcumin1001> | 
  START - Cookbook wmcs.toolforge.component.deploy for component jobs-emailer | 
  [tools] | 
            
  | 10:57 | 
  <dcaro@cloudcumin1001> | 
  END (PASS) - Cookbook wmcs.toolforge.component.deploy (exit_code=0) for component jobs-emailer | 
  [toolsbeta] | 
            
  | 10:53 | 
  <dcaro@cloudcumin1001> | 
  START - Cookbook wmcs.toolforge.component.deploy for component jobs-emailer | 
  [toolsbeta] | 
            
  | 10:50 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 10:50 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 10:50 | 
  <elukey@cumin2002> | 
  END (FAIL) - Cookbook sre.hosts.provision (exit_code=99) for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 10:49 | 
  <elukey@cumin2002> | 
  START - Cookbook sre.hosts.provision for host thanos-be2005.mgmt.codfw.wmnet with chassis set policy FORCE_RESTART | 
  [production] | 
            
  | 10:46 | 
  <dcausse@deploy2002> | 
  helmfile [eqiad] DONE helmfile.d/services/rdf-streaming-updater: apply | 
  [production] |