> ## Documentation Index
> Fetch the complete documentation index at: https://runpod-b18f5ded-lg-apiv2-new.mintlify.site/llms.txt
> Use this file to discover all available pages before exploring further.

# List serverless endpoint workers

> Returns the active workers for a serverless endpoint plus a summary of
worker counts. Each worker's `status` is derived by reconciling the
worker pod's lifecycle status with the endpoint's live job-queue view.
When the job-queue view is unavailable the response degrades to the
pod-derived status and counts.




## OpenAPI

````yaml get /v2/serverless/{id}/workers
openapi: 3.0.3
info:
  title: RunPod REST API
  version: 2.0.0
  description: RunPod public REST API — v2
servers:
  - url: /
    description: Current server
security:
  - bearerAuth: []
paths:
  /v2/serverless/{id}/workers:
    parameters:
      - name: id
        in: path
        required: true
        schema:
          type: string
        description: Serverless endpoint identifier
        example: ep_abc123
    get:
      tags:
        - Serverless
      summary: List serverless endpoint workers
      description: |
        Returns the active workers for a serverless endpoint plus a summary of
        worker counts. Each worker's `status` is derived by reconciling the
        worker pod's lifecycle status with the endpoint's live job-queue view.
        When the job-queue view is unavailable the response degrades to the
        pod-derived status and counts.
      operationId: listEndpointWorkers
      responses:
        '200':
          description: OK
          content:
            application/json:
              schema:
                $ref: '#/components/schemas/ListEndpointWorkersResponse'
        '404':
          description: Serverless endpoint not found
          content:
            application/problem+json:
              schema:
                $ref: '#/components/schemas/ErrorResponse'
        default:
          description: Error
          content:
            application/problem+json:
              schema:
                $ref: '#/components/schemas/ErrorResponse'
components:
  schemas:
    ListEndpointWorkersResponse:
      type: object
      required:
        - workers
        - summary
      properties:
        workers:
          type: array
          items:
            $ref: '#/components/schemas/Worker'
        summary:
          $ref: '#/components/schemas/WorkerSummary'
        endpointVersion:
          type: integer
          nullable: true
          description: |
            The endpoint's current configuration version. A worker whose
            `version` differs is running stale config (see `worker.isStale`).
            Null if unknown.
          example: 4
    ErrorResponse:
      type: object
      properties:
        title:
          type: string
          description: Short human-readable summary
          example: Not Found
        status:
          type: integer
          description: HTTP status code
          example: 404
        detail:
          type: string
          description: Human-readable explanation
          example: pod not found
    Worker:
      type: object
      required:
        - id
        - status
        - gpuCount
        - isStale
      properties:
        id:
          type: string
          example: worker_abc
        status:
          $ref: '#/components/schemas/WorkerStatus'
        isStale:
          type: boolean
          description: >
            True when the worker is running an older endpoint configuration than

            the current one (e.g. mid rolling-update). This is the authoritative

            flag: it is derived from `version` vs the response's
            `endpointVersion`,

            except on legacy endpoints (`endpointVersion` 1) where it falls back

            to a container-image comparison.
          example: false
        version:
          type: integer
          nullable: true
          description: |
            Endpoint configuration version this worker is running. Compare with
            the response's `endpointVersion`. Null if unknown.
          example: 4
        gpuCount:
          type: integer
          minimum: 0
          description: GPUs allocated to the worker.
          example: 1
        image:
          type: string
          nullable: true
          description: Container image the worker is running.
          example: my-org/sdxl-worker:latest
        uptimeSeconds:
          type: integer
          minimum: 0
          nullable: true
          description: >-
            Seconds the worker has been running. Null until the worker is placed
            and running.
          example: 3600
        gpuTypeId:
          type: string
          nullable: true
          description: GPU type the worker is placed on. Null until the worker is placed.
          example: NVIDIA RTX 4090
        dataCenterId:
          type: string
          nullable: true
          description: >-
            Data center the worker is placed in. Null until the worker is
            placed.
          example: US-TX-3
        startedAt:
          type: string
          format: date-time
          nullable: true
          description: When the worker last started. Null if it has not started.
          example: '2026-03-26T00:00:00Z'
    WorkerSummary:
      type: object
      description: |
        Histogram of the returned workers by status. The per-status counts are a
        roll-up of the `workers` array, so `running + idle + initializing +
        throttled + unhealthy == total == len(workers)`.
      required:
        - running
        - idle
        - initializing
        - throttled
        - unhealthy
        - total
      properties:
        running:
          type: integer
          minimum: 0
          description: Workers actively processing a job.
          example: 2
        idle:
          type: integer
          minimum: 0
          description: Ready workers polling for jobs.
          example: 1
        initializing:
          type: integer
          minimum: 0
          description: Workers starting up, not yet ready.
          example: 0
        throttled:
          type: integer
          minimum: 0
          description: Workers waiting on compute capacity.
          example: 0
        unhealthy:
          type: integer
          minimum: 0
          description: Workers failing health checks.
          example: 0
        total:
          type: integer
          minimum: 0
          description: All workers currently allocated to the endpoint.
          example: 3
    WorkerStatus:
      type: string
      description: |
        Derived worker state, reconciled from the worker pod's lifecycle status
        and the live job-queue view.
        - `RUNNING`      — actively processing a job
        - `IDLE`         — ready and polling for jobs
        - `INITIALIZING` — starting up, not yet ready
        - `THROTTLED`    — waiting on compute capacity
        - `UNHEALTHY`    — failing health checks
      x-enum-varnames:
        - WorkerStatusRunning
        - WorkerStatusIdle
        - WorkerStatusInitializing
        - WorkerStatusThrottled
        - WorkerStatusUnhealthy
      enum:
        - RUNNING
        - IDLE
        - INITIALIZING
        - THROTTLED
        - UNHEALTHY
  securitySchemes:
    bearerAuth:
      type: http
      scheme: bearer
      bearerFormat: RunPod API Key

````