2021-10-18
§
|
15:17 |
<joal> |
Rerun failed instances from cassandra-hourly-coord-local_group_default_T_pageviews_per_project_v2 |
[analytics] |
14:49 |
<elukey> |
restart hadoop-yarn-nodemanager on an-worker1119 and an-worker1103 (Java OOM in the logs) |
[analytics] |
12:09 |
<btullis> |
root@aqs1013:/srv/cassandra-b/tmp# systemctl restart cassandra-b.service |
[analytics] |
12:09 |
<btullis> |
root@aqs1012:/srv/cassandra-b/tmp# systemctl restart cassandra-b.service |
[analytics] |
09:25 |
<btullis> |
btullis@cumin1001:~$ sudo transfer.py aqs1013.eqiad.wmnet:/srv/cassandra-b/tmp/local_group_default_T_pageviews_per_article_flat an-presto1001.eqiad.wmnet:/srv/cassandra_migration/aqs1013-b/ |
[analytics] |
09:17 |
<btullis> |
btullis@cumin1001:~$ sudo transfer.py aqs1012.eqiad.wmnet:/srv/cassandra-b/tmp/local_group_default_T_pageviews_per_article_flat an-presto1001.eqiad.wmnet:/srv/cassandra_migration/aqs1012-b/ |
[analytics] |
09:16 |
<btullis> |
btullis@cumin1001:~$ sudo transfer.py aqs1012.eqiad.wmnet:/srv/cassandra-b/tmp/local_group_default_T_pageviews_per_article_flat an-presto1001.eqiad.wmnet:/srv/cassandra_migration/cassandra_migration/aqs1012-b/ |
[analytics] |
2021-09-24
§
|
22:33 |
<razzi> |
restart an-test-coord presto coordinator service to experiment with web-ui.authentication.type=fixed |
[analytics] |
15:06 |
<btullis> |
btullis@cumin1001:~$ sudo cumin --mode async 'aqs100[4,7].eqiad.wmnet' 'nodetool-a snapshot -t T291469' 'nodetool-b snapshot -t T291469' |
[analytics] |
14:47 |
<btullis> |
btullis@aqs1007:~$ sudo nodetool-a repair --full local_group_default_T_mediarequest_per_file data |
[analytics] |
11:02 |
<btullis> |
btullis@an-master1001:~$ sudo systemctl restart hadoop-mapreduce-historyserver |
[analytics] |
10:47 |
<btullis> |
btullis@an-master1002:~$ sudo systemctl restart hadoop-hdfs-namenode |
[analytics] |
10:47 |
<btullis> |
btullis@an-master1002:~$ sudo systemctl restart hadoop-hdfs-zkfc |
[analytics] |
10:35 |
<btullis> |
btullis@an-master1001:~$ sudo -u hdfs kerberos-run-command hdfs /usr/bin/hdfs haadmin -failover an-master1002-eqiad-wmnet an-master1001-eqiad-wmnet |
[analytics] |
10:07 |
<btullis> |
btullis@an-launcher1002:~$ sudo -u analytics kerberos-run-command analytics /usr/local/bin/refine_eventlogging_legacy --ignore_failure_flag=true --table_include_regex='centralnoticeimpression' --since='2021-09-23T04:00:00.000Z' --until='2021-09-24T05:00:00.000Z' |
[analytics] |