From 718e3098ec2cd9126b343d16ea780763aee7c662 Mon Sep 17 00:00:00 2001 From: DebakelOrakel <78408921+DebakelOrakel@users.noreply.github.com> Date: Tue, 16 Jan 2024 14:50:41 +0100 Subject: [PATCH] Include resolving steps in check_cephcluster_status partial (#153) Co-authored-by: Stephan Feurer --- .../ROOT/pages/runbooks/CephOSDFlapping.adoc | 27 ------------------- .../runbooks/check_cephcluster_status.adoc | 27 +++++++++++++++++++ 2 files changed, 27 insertions(+), 27 deletions(-) diff --git a/docs/modules/ROOT/pages/runbooks/CephOSDFlapping.adoc b/docs/modules/ROOT/pages/runbooks/CephOSDFlapping.adoc index 3e1d5cce..36d965ec 100644 --- a/docs/modules/ROOT/pages/runbooks/CephOSDFlapping.adoc +++ b/docs/modules/ROOT/pages/runbooks/CephOSDFlapping.adoc @@ -32,33 +32,6 @@ In particular, check whether section `State` for container `osd` has a note that include::partial$runbooks/check_cephcluster_status.adoc[] -==== Check Ceph crash logs - -[source,console] ----- -$ ceph_cluster_ns=syn-rook-ceph-cluster -$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- ceph crash ls <1> -[ ... list of crash logs ... ] -$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ - ceph crash info <crash-id> <2> -[ ... detailed crash info ... 
] ----- -<1> List currently not archived crash logs -<2> Show detailed information of crash log with id `<crash-id>` - -==== Archive Ceph crash logs - -[source,console] ----- -$ ceph_cluster_ns=syn-rook-ceph-cluster -$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ - ceph crash archive-all <1> -$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ - ceph crash archive <crash-id> <2> ----- -<1> Archive all currently not archived crash logs -<2> Archive crash log with id `<crash-id>` - == icon:book[] Upstream documentation https://docs.ceph.com/en/latest/rados/troubleshooting/troubleshooting-osd#flapping-osds diff --git a/docs/modules/ROOT/partials/runbooks/check_cephcluster_status.adoc b/docs/modules/ROOT/partials/runbooks/check_cephcluster_status.adoc index 9388b7b5..e636d376 100644 --- a/docs/modules/ROOT/partials/runbooks/check_cephcluster_status.adoc +++ b/docs/modules/ROOT/partials/runbooks/check_cephcluster_status.adoc @@ -17,3 +17,30 @@ $ kubectl -n ${ceph_cluster_ns} exec -it deploy/rook-ceph-tools -- ceph status <1> General cluster health status <2> One or more lines of information giving details why the cluster state is degraded. Only available if the cluster health isn't `HEALTH_OK`. + +==== Check Ceph crash logs + +[source,console] +---- +$ ceph_cluster_ns=syn-rook-ceph-cluster +$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- ceph crash ls <1> +[ ... list of crash logs ... ] +$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ + ceph crash info <crash-id> <2> +[ ... detailed crash info ... 
] +---- +<1> List currently not archived crash logs +<2> Show detailed information of crash log with id `<crash-id>` + +==== Archive Ceph crash logs + +[source,console] +---- +$ ceph_cluster_ns=syn-rook-ceph-cluster +$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ + ceph crash archive-all <1> +$ kubectl -n "${ceph_cluster_ns}" exec -it deploy/rook-ceph-tools -- \ + ceph crash archive <crash-id> <2> +---- +<1> Archive all currently not archived crash logs +<2> Archive crash log with id `<crash-id>`