Skip to content

Commit

Permalink
update V1.0 benchmark manifest (#822)
Browse files Browse the repository at this point in the history
Co-authored-by: Zhenzhong1 <zhenzhong.xu@intel.com>
  • Loading branch information
chensuyue and Zhenzhong1 authored Sep 18, 2024
1 parent e2a74f7 commit e5affb9
Show file tree
Hide file tree
Showing 22 changed files with 38 additions and 70 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 8
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 4
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 2
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 8
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 4
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -134,7 +134,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 1
replicas: 2
selector:
matchLabels:
app: embedding-dependency-deploy
Expand Down Expand Up @@ -223,10 +223,6 @@ spec:
- '2048'
- --max-total-tokens
- '4096'
- --max-batch-total-tokens
- '65536'
- --max-batch-prefill-tokens
- '4096'
env:
- name: OMPI_MCA_btl_vader_single_copy_mechanism
value: none
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -216,10 +216,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
serviceAccountName: default
volumes:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -216,10 +216,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
serviceAccountName: default
volumes:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -216,10 +216,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
serviceAccountName: default
volumes:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down Expand Up @@ -399,7 +399,7 @@ metadata:
name: retriever-deploy
namespace: default
spec:
replicas: 1
replicas: 2
selector:
matchLabels:
app: retriever-deploy
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ metadata:
name: chatqna-backend-server-deploy
namespace: default
spec:
replicas: 4
replicas: 8
selector:
matchLabels:
app: chatqna-backend-server-deploy
Expand Down Expand Up @@ -141,7 +141,7 @@ metadata:
name: embedding-dependency-deploy
namespace: default
spec:
replicas: 4
replicas: 8
selector:
matchLabels:
app: embedding-dependency-deploy
Expand All @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down Expand Up @@ -313,7 +313,7 @@ metadata:
name: retriever-deploy
namespace: default
spec:
replicas: 4
replicas: 8
selector:
matchLabels:
app: retriever-deploy
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -167,10 +167,10 @@ spec:
- containerPort: 80
resources:
limits:
cpu: 80
cpu: 76
memory: 20000Mi
requests:
cpu: 80
cpu: 76
memory: 20000Mi
volumeMounts:
- mountPath: /data
Expand Down

0 comments on commit e5affb9

Please sign in to comment.