- Kuberay operator logs:
kubectl logs $KUBERAY_OPERATOR_POD -n $YOUR_NAMESPACE | tee operator-log
{"level":"info","ts":"2024-04-20T01:11:24.753Z","logger":"setup","msg":"Flag watchNamespace is not set. Watch custom resources in all namespaces."}
{"level":"info","ts":"2024-04-20T01:11:24.753Z","logger":"setup","msg":"Setup manager"}
{"level":"info","ts":"2024-04-20T01:11:24.861Z","logger":"setup","msg":"starting manager"}
{"level":"info","ts":"2024-04-20T01:11:24.861Z","logger":"controller-runtime.metrics","msg":"Starting metrics server"}
{"level":"info","ts":"2024-04-20T01:11:24.861Z","logger":"controller-runtime.metrics","msg":"Serving metrics server","bindAddress":":8080","secure":false}
{"level":"info","ts":"2024-04-20T01:11:24.861Z","msg":"starting server","kind":"health probe","addr":"[::]:8082"}
I0420 01:11:27.650475 1 leaderelection.go:250] attempting to acquire leader lease rubrik-spark/ray-operator-leader...
I0420 01:11:43.072466 1 leaderelection.go:260] successfully acquired lease rubrik-spark/ray-operator-leader
{"level":"info","ts":"2024-04-20T01:11:43.073Z","logger":"controllers.RayCluster","msg":"Starting EventSource","source":"kind source: *v1.RayCluster"}
{"level":"info","ts":"2024-04-20T01:11:43.073Z","logger":"controllers.RayCluster","msg":"Starting EventSource","source":"kind source: *v1.Pod"}
{"level":"info","ts":"2024-04-20T01:11:43.073Z","logger":"controllers.RayCluster","msg":"Starting EventSource","source":"kind source: *v1.Service"}
{"level":"info","ts":"2024-04-20T01:11:43.073Z","logger":"controllers.RayCluster","msg":"Starting Controller"}
{"level":"info","ts":"2024-04-20T01:11:43.073Z","logger":"controllers.RayJob","msg":"Starting EventSource","source":"kind source: *v1.RayJob"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayJob","msg":"Starting EventSource","source":"kind source: *v1.RayCluster"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayJob","msg":"Starting EventSource","source":"kind source: *v1.Service"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayJob","msg":"Starting EventSource","source":"kind source: *v1.Job"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayJob","msg":"Starting Controller"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayService","msg":"Starting EventSource","source":"kind source: *v1.RayService"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayService","msg":"Starting EventSource","source":"kind source: *v1.RayCluster"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayService","msg":"Starting EventSource","source":"kind source: *v1.Service"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayService","msg":"Starting EventSource","source":"kind source: *v1.Ingress"}
{"level":"info","ts":"2024-04-20T01:11:43.074Z","logger":"controllers.RayService","msg":"Starting Controller"}
{"level":"info","ts":"2024-04-20T01:11:43.975Z","logger":"controllers.RayCluster","msg":"Starting workers","worker count":1}
{"level":"info","ts":"2024-04-20T01:11:43.980Z","logger":"controllers.RayService","msg":"Starting workers","worker count":1}
{"level":"info","ts":"2024-04-20T01:11:44.051Z","logger":"controllers.RayJob","msg":"Starting workers","worker count":1}
{"level":"info","ts":"2024-04-20T01:14:13.968Z","logger":"controllers.RayService","msg":"No active Ray cluster. RayService operator should prepare a new Ray cluster.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"a7afdd7c-47d2-4012-be34-18a62df2936f"}
{"level":"info","ts":"2024-04-20T01:14:13.968Z","logger":"controllers.RayService","msg":"Current cluster is unhealthy, prepare to restart.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"a7afdd7c-47d2-4012-be34-18a62df2936f","Status":{"activeServiceStatus":{"rayClusterStatus":{"desiredCPU":"0","desiredMemory":"0","desiredGPU":"0","desiredTPU":"0","head":{}}},"pendingServiceStatus":{"rayClusterStatus":{"desiredCPU":"0","desiredMemory":"0","desiredGPU":"0","desiredTPU":"0","head":{}}},"observedGeneration":1}}
{"level":"info","ts":"2024-04-20T01:14:13.986Z","logger":"KubeAPIWarningLogger","msg":"unknown field \"spec.rayClusterConfig.headGroupSpec.template.metadata.creationTimestamp\""}
{"level":"info","ts":"2024-04-20T01:14:13.986Z","logger":"KubeAPIWarningLogger","msg":"unknown field \"spec.rayClusterConfig.workerGroupSpecs[0].template.metadata.creationTimestamp\""}
{"level":"info","ts":"2024-04-20T01:14:14.050Z","logger":"controllers.RayService","msg":"Done reconcileRayCluster update status, enter next loop to create new ray cluster.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"a7afdd7c-47d2-4012-be34-18a62df2936f"}
{"level":"info","ts":"2024-04-20T01:14:16.051Z","logger":"controllers.RayService","msg":"Creating a new pending RayCluster instance.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a"}
{"level":"info","ts":"2024-04-20T01:14:16.051Z","logger":"controllers.RayService","msg":"createRayClusterInstance","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a","rayClusterInstanceName":"rayservice-sample-raycluster-9s5d7"}
{"level":"info","ts":"2024-04-20T01:14:16.051Z","logger":"controllers.RayService","msg":"No pending RayCluster, creating RayCluster.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a"}
{"level":"info","ts":"2024-04-20T01:14:16.063Z","logger":"KubeAPIWarningLogger","msg":"unknown field \"spec.headGroupSpec.template.metadata.creationTimestamp\""}
{"level":"info","ts":"2024-04-20T01:14:16.063Z","logger":"KubeAPIWarningLogger","msg":"unknown field \"spec.workerGroupSpecs[0].template.metadata.creationTimestamp\""}
{"level":"info","ts":"2024-04-20T01:14:16.064Z","logger":"controllers.RayService","msg":"created rayCluster for rayService","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a","rayCluster":{"namespace":"rubrik-spark","name":"rayservice-sample-raycluster-9s5d7"}}
{"level":"info","ts":"2024-04-20T01:14:16.064Z","logger":"controllers.RayService","msg":"Check the head Pod status of the pending RayCluster","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a","RayCluster name":"rayservice-sample-raycluster-9s5d7"}
{"level":"info","ts":"2024-04-20T01:14:16.064Z","logger":"controllers.RayCluster","msg":"Reconciling Ingress","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265"}
{"level":"error","ts":"2024-04-20T01:14:16.064Z","logger":"controllers.RayService","msg":"Failed to check if head Pod is running and ready!","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a","error":"Found 0 head pods for RayCluster rayservice-sample-raycluster-9s5d7 in the namespace rubrik-spark","stacktrace":"github.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).reconcileServe\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:1069\ngithub.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).Reconcile\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:168\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Reconcile\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:119\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).reconcileHandler\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:316\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).processNextWorkItem\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:266\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Start.func2.2\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:227"}
{"level":"error","ts":"2024-04-20T01:14:16.064Z","logger":"controllers.RayService","msg":"Fail to reconcileServe.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"afbab1ea-067b-4d31-8b07-553026007b3a","error":"Found 0 head pods for RayCluster rayservice-sample-raycluster-9s5d7 in the namespace rubrik-spark","stacktrace":"github.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).Reconcile\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:169\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Reconcile\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:119\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).reconcileHandler\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:316\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).processNextWorkItem\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:266\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Start.func2.2\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:227"}
{"level":"info","ts":"2024-04-20T01:14:16.065Z","logger":"controllers.RayService","msg":"Check the head Pod status of the pending RayCluster","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"3354d6f3-9a15-4a87-b56b-9eb7c809f7f1","RayCluster name":"rayservice-sample-raycluster-9s5d7"}
{"level":"error","ts":"2024-04-20T01:14:16.066Z","logger":"controllers.RayService","msg":"Failed to check if head Pod is running and ready!","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"3354d6f3-9a15-4a87-b56b-9eb7c809f7f1","error":"Found 0 head pods for RayCluster rayservice-sample-raycluster-9s5d7 in the namespace rubrik-spark","stacktrace":"github.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).reconcileServe\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:1069\ngithub.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).Reconcile\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:168\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Reconcile\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:119\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).reconcileHandler\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:316\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).processNextWorkItem\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:266\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Start.func2.2\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:227"}
{"level":"error","ts":"2024-04-20T01:14:16.066Z","logger":"controllers.RayService","msg":"Fail to reconcileServe.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"3354d6f3-9a15-4a87-b56b-9eb7c809f7f1","error":"Found 0 head pods for RayCluster rayservice-sample-raycluster-9s5d7 in the namespace rubrik-spark","stacktrace":"github.com/ray-project/kuberay/ray-operator/controllers/ray.(*RayServiceReconciler).Reconcile\n\t/home/runner/work/kuberay/kuberay/ray-operator/controllers/ray/rayservice_controller.go:169\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Reconcile\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:119\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).reconcileHandler\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:316\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).processNextWorkItem\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:266\nsigs.k8s.io/controller-runtime/pkg/internal/controller.(*Controller).Start.func2.2\n\t/home/runner/go/pkg/mod/sigs.k8s.io/controller-runtime@v0.16.3/pkg/internal/controller/controller.go:227"}
{"level":"info","ts":"2024-04-20T01:14:16.106Z","logger":"controllers.RayCluster","msg":"Pod Service created successfully","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","service name":"rayservice-sample-raycluster-9s5d7-head-svc"}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","Found 0 head Pods; creating a head Pod for the RayCluster.":"rayservice-sample-raycluster-9s5d7"}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"head pod labels","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","labels":{"app.kubernetes.io/created-by":"kuberay-operator","app.kubernetes.io/name":"kuberay","ray.io/cluster":"rayservice-sample-raycluster-9s5d7","ray.io/group":"headgroup","ray.io/identifier":"rayservice-sample-raycluster-9s5d7-head","ray.io/is-ray-node":"yes","ray.io/node-type":"head"}}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"generateRayStartCommand","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","nodeType":"head","rayStartParams":{"block":"true","dashboard-agent-listen-port":"52365","dashboard-host":"0.0.0.0","metrics-export-port":"8080"},"Ray container resource":{"limits":{"cpu":"2","memory":"2Gi"},"requests":{"cpu":"2","memory":"2Gi"}}}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"generateRayStartCommand","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","rayStartCmd":"ray start --head --dashboard-agent-listen-port=52365 --num-cpus=2 --memory=2147483648 --dashboard-host=0.0.0.0 --metrics-export-port=8080 --block "}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"BuildPod","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","rayNodeType":"head","generatedCmd":"ulimit -n 65536; ray start --head --dashboard-agent-listen-port=52365 --num-cpus=2 --memory=2147483648 --dashboard-host=0.0.0.0 --metrics-export-port=8080 --block "}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"Probes injection feature flag","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","enabled":true}
{"level":"info","ts":"2024-04-20T01:14:16.107Z","logger":"controllers.RayCluster","msg":"createHeadPod","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","head pod with name":"rayservice-sample-raycluster-9s5d7-head-"}
{"level":"info","ts":"2024-04-20T01:14:16.150Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","desired workerReplicas (always adhering to minReplicas/maxReplica)":1,"worker group":"small-group","maxReplicas":50,"minReplicas":1,"replicas":1}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","removing the pods in the scaleStrategy of":"small-group"}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","workerReplicas":1,"runningPods":0,"diff":1}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","Number workers to add":1,"Worker group":"small-group"}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","creating worker for group":"small-group","index 0":"in total 1"}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"generateRayStartCommand","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","nodeType":"worker","rayStartParams":{"address":"rayservice-sample-raycluster-9s5d7-head-svc.rubrik-spark.svc.cluster.local:6379","block":"true","dashboard-agent-listen-port":"52365","metrics-export-port":"8080"},"Ray container resource":{"limits":{"cpu":"3","memory":"2Gi"},"requests":{"cpu":"3","memory":"2Gi"}}}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"generateRayStartCommand","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","rayStartCmd":"ray start --address=rayservice-sample-raycluster-9s5d7-head-svc.rubrik-spark.svc.cluster.local:6379 --metrics-export-port=8080 --block --dashboard-agent-listen-port=52365 --num-cpus=3 --memory=2147483648 "}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"BuildPod","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","rayNodeType":"worker","generatedCmd":"ulimit -n 65536; ray start --address=rayservice-sample-raycluster-9s5d7-head-svc.rubrik-spark.svc.cluster.local:6379 --metrics-export-port=8080 --block --dashboard-agent-listen-port=52365 --num-cpus=3 --memory=2147483648 "}
{"level":"info","ts":"2024-04-20T01:14:16.151Z","logger":"controllers.RayCluster","msg":"Probes injection feature flag","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","enabled":true}
{"level":"info","ts":"2024-04-20T01:14:16.174Z","logger":"controllers.RayCluster","msg":"Created pod","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","Pod ":"ervice-sample-raycluster-9s5d7-worker-small-group-"}
{"level":"info","ts":"2024-04-20T01:14:16.175Z","logger":"controllers.RayCluster","msg":"CheckAllPodsRunning: Pod is not running; Pod Name: rayservice-sample-raycluster-9s5d7-head-z5st7; Pod Status.Phase: Pending","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265"}
{"level":"info","ts":"2024-04-20T01:14:16.176Z","logger":"controllers.RayCluster","msg":"inconsistentRayClusterStatus","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","detect inconsistency":"old AvailableWorkerReplicas: 0, new AvailableWorkerReplicas: 0, old DesiredWorkerReplicas: 0, new DesiredWorkerReplicas: 1, old MinWorkerReplicas: 0, new MinWorkerReplicas: 1, old MaxWorkerReplicas: 0, new MaxWorkerReplicas: 50"}
{"level":"info","ts":"2024-04-20T01:14:16.176Z","logger":"controllers.RayCluster","msg":"rayClusterReconcile","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","Update CR status":"rayservice-sample-raycluster-9s5d7","status":{"desiredWorkerReplicas":1,"minWorkerReplicas":1,"maxWorkerReplicas":50,"desiredCPU":"5","desiredMemory":"4Gi","desiredGPU":"0","desiredTPU":"0","lastUpdateTime":"2024-04-20T01:14:16Z","endpoints":{"client":"10001","dashboard":"8265","gcs-server":"6379","metrics":"8080","serve":"8000"},"head":{"serviceIP":"10.92.15.52"},"observedGeneration":1}}
{"level":"info","ts":"2024-04-20T01:14:16.251Z","logger":"controllers.RayCluster","msg":"Environment variable RAYCLUSTER_DEFAULT_REQUEUE_SECONDS_ENV is not set, using default value of 300 seconds","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","cluster name":"rayservice-sample-raycluster-9s5d7"}
{"level":"info","ts":"2024-04-20T01:14:16.251Z","logger":"controllers.RayCluster","msg":"Unconditional requeue after","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"07f82f27-a29c-41fc-a2eb-a5ce955d4265","cluster name":"rayservice-sample-raycluster-9s5d7","seconds":300}
{"level":"info","ts":"2024-04-20T01:14:16.251Z","logger":"controllers.RayCluster","msg":"Reconciling Ingress","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc"}
{"level":"info","ts":"2024-04-20T01:14:16.251Z","logger":"controllers.RayCluster","msg":"reconcileHeadService","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","1 head service found":"rayservice-sample-raycluster-9s5d7-head-svc"}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","Found 1 head Pod":"rayservice-sample-raycluster-9s5d7-head-z5st7","Pod status":"Pending","Pod restart policy":"Always","Ray container terminated status":"nil"}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","head Pod":"rayservice-sample-raycluster-9s5d7-head-z5st7","shouldDelete":false,"reason":"KubeRay does not need to delete the head Pod rayservice-sample-raycluster-9s5d7-head-z5st7. The Pod status is Pending, and the Ray container terminated status is nil."}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","desired workerReplicas (always adhering to minReplicas/maxReplica)":1,"worker group":"small-group","maxReplicas":50,"minReplicas":1,"replicas":1}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","worker Pod":"ervice-sample-raycluster-9s5d7-worker-small-group-5zqcc","shouldDelete":false,"reason":"KubeRay does not need to delete the worker Pod ervice-sample-raycluster-9s5d7-worker-small-group-5zqcc. The Pod status is Pending, and the Ray container terminated status is nil."}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","removing the pods in the scaleStrategy of":"small-group"}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","workerReplicas":1,"runningPods":1,"diff":0}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayCluster","msg":"reconcilePods","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","all workers already exist for group":"small-group"}
{"level":"info","ts":"2024-04-20T01:14:16.252Z","logger":"controllers.RayService","msg":"Check the head Pod status of the pending RayCluster","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"5935e12d-dfe7-4c36-9bf7-56bc5a3858a7","RayCluster name":"rayservice-sample-raycluster-9s5d7"}
{"level":"info","ts":"2024-04-20T01:14:16.253Z","logger":"controllers.RayCluster","msg":"CheckAllPodsRunning: Pod is not running; Pod Name: rayservice-sample-raycluster-9s5d7-head-z5st7; Pod Status.Phase: Pending","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc"}
{"level":"info","ts":"2024-04-20T01:14:16.253Z","logger":"controllers.RayService","msg":"Skipping the update of Serve deployments because the Ray head Pod is not ready.","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"5935e12d-dfe7-4c36-9bf7-56bc5a3858a7"}
{"level":"info","ts":"2024-04-20T01:14:16.253Z","logger":"controllers.RayService","msg":"Ray Serve applications are not ready to serve requests: checking again in 2ss","RayService":{"name":"rayservice-sample","namespace":"rubrik-spark"},"reconcileID":"5935e12d-dfe7-4c36-9bf7-56bc5a3858a7"}
{"level":"info","ts":"2024-04-20T01:14:16.254Z","logger":"controllers.RayCluster","msg":"inconsistentRayClusterStatus","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","detect inconsistency":"old AvailableWorkerReplicas: 0, new AvailableWorkerReplicas: 0, old DesiredWorkerReplicas: 0, new DesiredWorkerReplicas: 1, old MinWorkerReplicas: 0, new MinWorkerReplicas: 1, old MaxWorkerReplicas: 0, new MaxWorkerReplicas: 50"}
{"level":"info","ts":"2024-04-20T01:14:16.254Z","logger":"controllers.RayCluster","msg":"rayClusterReconcile","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","Update CR status":"rayservice-sample-raycluster-9s5d7","status":{"desiredWorkerReplicas":1,"minWorkerReplicas":1,"maxWorkerReplicas":50,"desiredCPU":"5","desiredMemory":"4Gi","desiredGPU":"0","desiredTPU":"0","lastUpdateTime":"2024-04-20T01:14:16Z","endpoints":{"client":"10001","dashboard":"8265","gcs-server":"6379","metrics":"8080","serve":"8000"},"head":{"serviceIP":"10.92.15.52"},"observedGeneration":1}}
{"level":"info","ts":"2024-04-20T01:14:16.262Z","logger":"controllers.RayCluster","msg":"Got error when updating status","RayCluster":{"name":"rayservice-sample-raycluster-9s5d7","namespace":"rubrik-spark"},"reconcileID":"44413d62-4bfb-4ea0-81cb-492cc75b00fc","cluster name":"rayservice-sample-raycluster-9s5d7","error":"Operation cannot be fulfilled on rayclusters.ray.io \"rayservice-sample-raycluster-9s5d7\": the object has been modified; please apply your changes to the latest version and try again","RayCluster":{"apiVersion":"ray.io/v1","kind":"RayCluster","namespace":"rubrik-spark","name":"rayservice-sample-raycluster-9s5d7"}}