Skip to content

Commit

Permalink
updating EFA_DEVICE details for AWS resources (#791)
Browse files Browse the repository at this point in the history
Co-authored-by: Alexander Jipa <[email protected]>
  • Loading branch information
Alexander Jipa and azzhipa authored Nov 20, 2023
1 parent 8048ef3 commit caba46a
Showing 1 changed file with 54 additions and 14 deletions.
68 changes: 54 additions & 14 deletions torchx/specs/named_resources_aws.py
Original file line number Diff line number Diff line change
@@ -137,25 +137,41 @@ def aws_g4dn_4xlarge() -> Resource:

 def aws_g4dn_8xlarge() -> Resource:
     return Resource(
-        cpu=32, gpu=1, memMB=128 * GiB, capabilities={K8S_ITYPE: "g4dn.8xlarge"}
+        cpu=32,
+        gpu=1,
+        memMB=128 * GiB,
+        capabilities={K8S_ITYPE: "g4dn.8xlarge"},
+        devices={EFA_DEVICE: 1},
     )


-def aws_g4dn_16xlarge() -> Resource:
+def aws_g4dn_12xlarge() -> Resource:
     return Resource(
-        cpu=64, gpu=1, memMB=256 * GiB, capabilities={K8S_ITYPE: "g4dn.16xlarge"}
+        cpu=48,
+        gpu=4,
+        memMB=192 * GiB,
+        capabilities={K8S_ITYPE: "g4dn.12xlarge"},
+        devices={EFA_DEVICE: 1},
     )


-def aws_g4dn_12xlarge() -> Resource:
+def aws_g4dn_16xlarge() -> Resource:
     return Resource(
-        cpu=48, gpu=4, memMB=192 * GiB, capabilities={K8S_ITYPE: "g4dn.12xlarge"}
+        cpu=64,
+        gpu=1,
+        memMB=256 * GiB,
+        capabilities={K8S_ITYPE: "g4dn.16xlarge"},
+        devices={EFA_DEVICE: 1},
     )


 def aws_g4dn_metal() -> Resource:
     return Resource(
-        cpu=96, gpu=8, memMB=384 * GiB, capabilities={K8S_ITYPE: "g4dn.metal"}
+        cpu=96,
+        gpu=8,
+        memMB=384 * GiB,
+        capabilities={K8S_ITYPE: "g4dn.metal"},
+        devices={EFA_DEVICE: 1},
     )


@@ -177,31 +193,51 @@ def aws_g5_4xlarge() -> Resource:

 def aws_g5_8xlarge() -> Resource:
     return Resource(
-        cpu=32, gpu=1, memMB=128 * GiB, capabilities={K8S_ITYPE: "g5.8xlarge"}
+        cpu=32,
+        gpu=1,
+        memMB=128 * GiB,
+        capabilities={K8S_ITYPE: "g5.8xlarge"},
+        devices={EFA_DEVICE: 1},
     )


-def aws_g5_16xlarge() -> Resource:
+def aws_g5_12xlarge() -> Resource:
     return Resource(
-        cpu=64, gpu=1, memMB=256 * GiB, capabilities={K8S_ITYPE: "g5.16xlarge"}
+        cpu=48,
+        gpu=4,
+        memMB=192 * GiB,
+        capabilities={K8S_ITYPE: "g5.12xlarge"},
+        devices={EFA_DEVICE: 1},
     )


-def aws_g5_12xlarge() -> Resource:
+def aws_g5_16xlarge() -> Resource:
     return Resource(
-        cpu=48, gpu=4, memMB=192 * GiB, capabilities={K8S_ITYPE: "g5.12xlarge"}
+        cpu=64,
+        gpu=1,
+        memMB=256 * GiB,
+        capabilities={K8S_ITYPE: "g5.16xlarge"},
+        devices={EFA_DEVICE: 1},
     )


 def aws_g5_24xlarge() -> Resource:
     return Resource(
-        cpu=96, gpu=4, memMB=384 * GiB, capabilities={K8S_ITYPE: "g5.24xlarge"}
+        cpu=96,
+        gpu=4,
+        memMB=384 * GiB,
+        capabilities={K8S_ITYPE: "g5.24xlarge"},
+        devices={EFA_DEVICE: 1},
     )


 def aws_g5_48xlarge() -> Resource:
     return Resource(
-        cpu=192, gpu=8, memMB=768 * GiB, capabilities={K8S_ITYPE: "g5.48xlarge"}
+        cpu=192,
+        gpu=8,
+        memMB=768 * GiB,
+        capabilities={K8S_ITYPE: "g5.48xlarge"},
+        devices={EFA_DEVICE: 1},
     )


@@ -213,7 +249,11 @@ def aws_trn1_2xlarge() -> Resource:

 def aws_trn1_32xlarge() -> Resource:
     return Resource(
-        cpu=128, gpu=0, memMB=512 * GiB, capabilities={K8S_ITYPE: "trn1.32xlarge"}
+        cpu=128,
+        gpu=0,
+        memMB=512 * GiB,
+        capabilities={K8S_ITYPE: "trn1.32xlarge"},
+        devices={EFA_DEVICE: 8},
     )


Expand Down

0 comments on commit caba46a

Please sign in to comment.