production SAL

1251-1300 of 10000 results (76ms)

2023-03-07 §
14:43	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:42	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:42	<cmooney@cumin1001>	START - Cookbook sre.hosts.remove-downtime for 238 hosts	[production]
14:42	<cmooney@cumin1001>	END (PASS) - Cookbook sre.hosts.remove-downtime (exit_code=0) for mr1-eqiad	[production]
14:42	<cmooney@cumin1001>	START - Cookbook sre.hosts.remove-downtime for mr1-eqiad	[production]
14:41	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:41	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:41	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:41	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:40	<moritzm>	enabling Puppet in eqiad/esams/drmrs after completed Switch maintenance T329073	[production]
14:40	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:40	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'sync'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'sync'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:38	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:36	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:29	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:26	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:26	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:25	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:25	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:24	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:24	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:21	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:21	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:21	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:20	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:20	<topranks>	issuing reboot to upgrade asw2-a-eqiad virtual-chassis to Junos 21.4	[production]
14:20	<akosiaris@deploy1002>	helmfile [eqiad] DONE helmfile.d/admin 'apply'.	[production]
14:19	<akosiaris@deploy1002>	helmfile [eqiad] START helmfile.d/admin 'apply'.	[production]
14:19	<cmjohnson@cumin1001>	END (PASS) - Cookbook sre.hardware.upgrade-firmware (exit_code=0) upgrade firmware for hosts ['cloudcephosd1038']	[production]
14:17	<akosiaris@cumin1001>	END (FAIL) - Cookbook sre.hosts.reimage (exit_code=99) for host kubernetes1020.eqiad.wmnet with OS bullseye	[production]
14:16	<cmooney@cumin1001>	END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on mr1-eqiad with reason: eqiad row A upgrade	[production]
14:16	<cmooney@cumin1001>	START - Cookbook sre.hosts.downtime for 2:00:00 on mr1-eqiad with reason: eqiad row A upgrade	[production]
14:15	<cmjohnson@cumin1001>	END (PASS) - Cookbook sre.hardware.upgrade-firmware (exit_code=0) upgrade firmware for hosts ['cloudcephosd1037']	[production]
14:13	<akosiaris>	kubectl cordon kubernetes{1005,1007,1008,1017,1018}.eqiad.wmnet T329073	[production]
14:13	<mvernon@cumin1001>	END (PASS) - Cookbook sre.hosts.reimage (exit_code=0) for host ms-be2070.codfw.wmnet with OS bullseye	[production]
14:12	<mvernon@cumin1001>	END (PASS) - Cookbook sre.puppet.sync-netbox-hiera (exit_code=0) generate netbox hiera data: "Triggered by cookbooks.sre.hosts.reimage: Host reimage - mvernon@cumin1001"	[production]
14:09	<cmjohnson@cumin1001>	START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudcephosd1038']	[production]
14:09	<cmooney@cumin1001>	END (PASS) - Cookbook sre.hosts.downtime (exit_code=0) for 2:00:00 on 238 hosts with reason: eqiad row A upgrade	[production]
14:09	<cmjohnson@cumin1001>	END (FAIL) - Cookbook sre.hardware.upgrade-firmware (exit_code=99) upgrade firmware for hosts ['cloudcephosd1038']	[production]
14:09	<cmjohnson@cumin1001>	START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudcephosd1038']	[production]
14:08	<akosiaris@cumin1001>	END (FAIL) - Cookbook sre.hosts.downtime (exit_code=99) for 2:00:00 on kubernetes1020.eqiad.wmnet with reason: host reimage	[production]
14:08	<akosiaris@cumin1001>	START - Cookbook sre.hosts.downtime for 2:00:00 on kubernetes1020.eqiad.wmnet with reason: host reimage	[production]
14:07	<cmjohnson@cumin1001>	START - Cookbook sre.hardware.upgrade-firmware upgrade firmware for hosts ['cloudcephosd1037']	[production]