<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Alerting on Long running pods in Container platforms</title>
    <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265312#M2814</link>
    <description>&lt;P&gt;&lt;a href="https://community.dynatrace.com/t5/user/viewprofilepage/user-id/64457"&gt;@PujithAnne&lt;/a&gt;&amp;nbsp;can you please describe the alert scenario in a bit of detail so we can advise.&lt;BR /&gt;Is there a specific scenario that you are trying to capture (not just that it's running longer than xx)?&lt;BR /&gt;&lt;BR /&gt;I'm assuming that you are looking for an alert where a pod or a job has not terminated and is left&amp;nbsp; in a 'terminating' status? These are covered by default.&lt;BR /&gt;&lt;BR /&gt;Or is this really a case where a pod has not received a termination&amp;nbsp; &amp;nbsp;signal and is left running?&amp;nbsp; This would not be covered and you'd need some custom metrics and alerts to capture this.&amp;nbsp;&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
    <pubDate>Mon, 16 Dec 2024 04:35:36 GMT</pubDate>
    <dc:creator>gopher</dc:creator>
    <dc:date>2024-12-16T04:35:36Z</dc:date>
    <item>
      <title>Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265305#M2811</link>
      <description>&lt;P&gt;Hi Team,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is there an option to alert on long-running pods in Kubernetes?&lt;/P&gt;</description>
      <pubDate>Sun, 15 Dec 2024 18:55:57 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265305#M2811</guid>
      <dc:creator>PujithAnne</dc:creator>
      <dc:date>2024-12-15T18:55:57Z</dc:date>
    </item>
    <item>
      <title>Re: Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265306#M2812</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.dynatrace.com/t5/user/viewprofilepage/user-id/64457"&gt;@PujithAnne&lt;/a&gt;&amp;nbsp;,&lt;BR /&gt;Can you please explain further what exactly you mean by alerting on long-running pods?&lt;BR /&gt;Do you want to be alerted if a pod runs for more than x days?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Sun, 15 Dec 2024 20:36:16 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265306#M2812</guid>
      <dc:creator>Maheedhar_T</dc:creator>
      <dc:date>2024-12-15T20:36:16Z</dc:date>
    </item>
    <item>
      <title>Re: Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265310#M2813</link>
      <description>&lt;P&gt;Yes, I want to get an alert for pods in a specific namespace that have been running for more than 1 day.&lt;/P&gt;</description>
      <pubDate>Mon, 16 Dec 2024 02:09:35 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265310#M2813</guid>
      <dc:creator>PujithAnne</dc:creator>
      <dc:date>2024-12-16T02:09:35Z</dc:date>
    </item>
    <item>
      <title>Re: Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265312#M2814</link>
      <description>&lt;P&gt;&lt;a href="https://community.dynatrace.com/t5/user/viewprofilepage/user-id/64457"&gt;@PujithAnne&lt;/a&gt;&amp;nbsp;can you please describe the alert scenario in a bit of detail so we can advise.&lt;BR /&gt;Is there a specific scenario that you are trying to capture (not just that it's running longer than xx)?&lt;BR /&gt;&lt;BR /&gt;I'm assuming that you are looking for an alert where a pod or a job has not terminated and is left&amp;nbsp; in a 'terminating' status? These are covered by default.&lt;BR /&gt;&lt;BR /&gt;Or is this really a case where a pod has not received a termination&amp;nbsp; &amp;nbsp;signal and is left running?&amp;nbsp; This would not be covered and you'd need some custom metrics and alerts to capture this.&amp;nbsp;&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 16 Dec 2024 04:35:36 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265312#M2814</guid>
      <dc:creator>gopher</dc:creator>
      <dc:date>2024-12-16T04:35:36Z</dc:date>
    </item>
    <item>
      <title>Re: Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265316#M2815</link>
      <description>&lt;P&gt;We have pods running a job that needs to complete and be terminated within 2-3 hours. We are seeing pods that run for more than 12 hours, consuming resources on the Kubernetes cluster. I have to delete the pods if they are older than 1 day to reduce resource consumption.&lt;BR /&gt;&lt;BR /&gt;Thanks,&lt;/P&gt;&lt;P&gt;Pujith&lt;/P&gt;</description>
      <pubDate>Mon, 16 Dec 2024 05:31:51 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265316#M2815</guid>
      <dc:creator>PujithAnne</dc:creator>
      <dc:date>2024-12-16T05:31:51Z</dc:date>
    </item>
    <item>
      <title>Re: Alerting on Long running pods</title>
      <link>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265317#M2816</link>
      <description>&lt;P&gt;&lt;a href="https://community.dynatrace.com/t5/user/viewprofilepage/user-id/64457"&gt;@PujithAnne&lt;/a&gt;&amp;nbsp;,&lt;BR /&gt;&lt;BR /&gt;out of the box, you're probably up the creek without a paddle.&amp;nbsp; uptime isn't kept as a searchable counter (as far as I know).&amp;nbsp; there is an uptime counter in Prometheus for kube pod metrics you could look at, but not sure if there would be suitable logic in grail to work out if it's above a set value (pre-calculated).&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;alternatively - you can use Kubernetes native methods like activeDeadlineSeconds to specify the maximum running time of a pod in your deployment spec.&lt;BR /&gt;&amp;nbsp;***use with extreme caution*** if time is up, it will terminate the pod. but you'll get what you're after and pod won't run for longer than expected.&amp;nbsp; you could theoretically set it for say '6 hours' or something at a point where you would consider it a lost cause and effectively safe to terminate.&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;PRE&gt;apiVersion: v1
kind: Pod
metadata:
  name: example-pod
spec:
  activeDeadlineSeconds: 3600  # Pod will be terminated after 1 hour (3600 seconds)&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;BR /&gt;Good luck&lt;/P&gt;</description>
      <pubDate>Mon, 16 Dec 2024 05:50:17 GMT</pubDate>
      <guid>https://community.dynatrace.com/t5/Container-platforms/Alerting-on-Long-running-pods/m-p/265317#M2816</guid>
      <dc:creator>gopher</dc:creator>
      <dc:date>2024-12-16T05:50:17Z</dc:date>
    </item>
  </channel>
</rss>

