We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8b79f68 commit a3ff52b Copy full SHA for a3ff52b
examples/offload/gke/benchmarks/deploy-cpu-offload.yaml
@@ -34,6 +34,12 @@ spec:
34
value: "4096"
35
- name: TPU_OFFLOAD_NUM_STAGING_BLOCKS
36
value: "256"
37
+ # Configure the pre-mapped CPU buffer for TPUs
38
+ # https://docs.cloud.google.com/tpu/docs/performance-guide#tpu_model_performance
39
+ - name: TPU_PREMAPPED_BUFFER_SIZE
40
+ value: "68719476736" # 64 GB
41
+ - name: TPU_PREMAPPED_BUFFER_TRANSFER_THRESHOLD_BYTES
42
43
ports:
44
- containerPort: 8000
45
resources:
0 commit comments