2024-05-24
§
|
12:16 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'fix wrong weight', diff saved to https://phabricator.wikimedia.org/P63085 and previous config saved to /var/cache/conftool/dbconfig/20240524-121641-arnaudb.json |
[production] |
12:16 |
<btullis@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/device-analytics: apply |
[production] |
12:16 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 12:00:00 on db1150.eqiad.wmnet with reason: Maintenance |
[production] |
12:16 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 12:00:00 on db1150.eqiad.wmnet with reason: Maintenance |
[production] |
12:15 |
<btullis@deploy1002> |
helmfile [eqiad] START helmfile.d/services/device-analytics: apply |
[production] |
12:15 |
<btullis@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/device-analytics: apply |
[production] |
12:15 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'db2176 (re)pooling @ 25%: post clone (src) repool', diff saved to https://phabricator.wikimedia.org/P63084 and previous config saved to /var/cache/conftool/dbconfig/20240524-121523-arnaudb.json |
[production] |
12:14 |
<btullis@deploy1002> |
helmfile [codfw] START helmfile.d/services/device-analytics: apply |
[production] |
12:08 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.mysql.clone (exit_code=0) of db2116.codfw.wmnet onto db2176.codfw.wmnet |
[production] |
11:53 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db1201 (T364299)', diff saved to https://phabricator.wikimedia.org/P63083 and previous config saved to /var/cache/conftool/dbconfig/20240524-115351-marostegui.json |
[production] |
11:53 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1201.eqiad.wmnet with reason: Maintenance |
[production] |
11:53 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 6:00:00 on db1201.eqiad.wmnet with reason: Maintenance |
[production] |
11:53 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1187 (T364299)', diff saved to https://phabricator.wikimedia.org/P63082 and previous config saved to /var/cache/conftool/dbconfig/20240524-115328-marostegui.json |
[production] |
11:44 |
<akosiaris> |
manually delete the 1 sessionstore pod running on parse1004 |
[production] |
11:38 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1187', diff saved to https://phabricator.wikimedia.org/P63081 and previous config saved to /var/cache/conftool/dbconfig/20240524-113820-marostegui.json |
[production] |
11:24 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/device-analytics: apply |
[production] |
11:24 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/device-analytics: apply |
[production] |
11:23 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1187', diff saved to https://phabricator.wikimedia.org/P63080 and previous config saved to /var/cache/conftool/dbconfig/20240524-112310-marostegui.json |
[production] |
11:22 |
<btullis@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/media-analytics: apply |
[production] |
11:22 |
<btullis@deploy1002> |
helmfile [eqiad] START helmfile.d/services/media-analytics: apply |
[production] |
11:21 |
<btullis@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/media-analytics: apply |
[production] |
11:21 |
<btullis@deploy1002> |
helmfile [codfw] START helmfile.d/services/media-analytics: apply |
[production] |
11:21 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/media-analytics: apply |
[production] |
11:20 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/media-analytics: apply |
[production] |
11:19 |
<btullis@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/page-analytics: apply |
[production] |
11:18 |
<btullis@deploy1002> |
helmfile [eqiad] START helmfile.d/services/page-analytics: apply |
[production] |
11:18 |
<btullis@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/page-analytics: apply |
[production] |
11:17 |
<btullis@deploy1002> |
helmfile [codfw] START helmfile.d/services/page-analytics: apply |
[production] |
11:15 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/page-analytics: apply |
[production] |
11:15 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/page-analytics: apply |
[production] |
11:10 |
<btullis@deploy1002> |
helmfile [eqiad] DONE helmfile.d/services/geo-analytics: apply |
[production] |
11:10 |
<btullis@deploy1002> |
helmfile [eqiad] START helmfile.d/services/geo-analytics: apply |
[production] |
11:10 |
<btullis@deploy1002> |
helmfile [codfw] DONE helmfile.d/services/geo-analytics: apply |
[production] |
11:09 |
<btullis@deploy1002> |
helmfile [codfw] START helmfile.d/services/geo-analytics: apply |
[production] |
11:08 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1187 (T364299)', diff saved to https://phabricator.wikimedia.org/P63079 and previous config saved to /var/cache/conftool/dbconfig/20240524-110802-marostegui.json |
[production] |
11:07 |
<btullis@deploy1002> |
helmfile [staging] DONE helmfile.d/services/geo-analytics: apply |
[production] |
11:07 |
<btullis@deploy1002> |
helmfile [staging] START helmfile.d/services/geo-analytics: apply |
[production] |
11:06 |
<jelto@cumin1002> |
END (PASS) - Cookbook sre.gitlab.upgrade (exit_code=0) on GitLab host gitlab2002.wikimedia.org with reason: Upgrade GitLab to new version |
[production] |
10:56 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3 days, 0:00:00 on db2150.codfw.wmnet with reason: reimage |
[production] |
10:55 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 3 days, 0:00:00 on db2150.codfw.wmnet with reason: reimage |
[production] |
10:49 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Depool db2150, hardware issues ', diff saved to https://phabricator.wikimedia.org/P63078 and previous config saved to /var/cache/conftool/dbconfig/20240524-104953-arnaudb.json |
[production] |
10:27 |
<arnaudb@cumin1002> |
START - Cookbook sre.mysql.clone of db2116.codfw.wmnet onto db2176.codfw.wmnet |
[production] |
10:24 |
<arnaudb@cumin1002> |
dbctl commit (dc=all): 'Depool db2116 to clone on db2176 T365793', diff saved to https://phabricator.wikimedia.org/P63077 and previous config saved to /var/cache/conftool/dbconfig/20240524-102424-arnaudb.json |
[production] |
10:23 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Depooling db1187 (T364299)', diff saved to https://phabricator.wikimedia.org/P63076 and previous config saved to /var/cache/conftool/dbconfig/20240524-102340-marostegui.json |
[production] |
10:23 |
<marostegui@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 6:00:00 on db1187.eqiad.wmnet with reason: Maintenance |
[production] |
10:23 |
<marostegui@cumin1002> |
START - Cookbook sre.hosts.downtime for 6:00:00 on db1187.eqiad.wmnet with reason: Maintenance |
[production] |
10:23 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1180 (T364299)', diff saved to https://phabricator.wikimedia.org/P63075 and previous config saved to /var/cache/conftool/dbconfig/20240524-102315-marostegui.json |
[production] |
10:08 |
<marostegui@cumin1002> |
dbctl commit (dc=all): 'Repooling after maintenance db1180', diff saved to https://phabricator.wikimedia.org/P63074 and previous config saved to /var/cache/conftool/dbconfig/20240524-100807-marostegui.json |
[production] |
09:54 |
<arnaudb@cumin1002> |
END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 3 days, 0:00:00 on db2176.codfw.wmnet with reason: Host has issues |
[production] |
09:54 |
<arnaudb@cumin1002> |
START - Cookbook sre.hosts.downtime for 3 days, 0:00:00 on db2176.codfw.wmnet with reason: Host has issues |
[production] |