Yong Wu
committed on
Commit
·
d5ff5a1
1
Parent(s):
98e2462
inputs from SGL serving
Browse files
- bs1/request_001/gemm1_weights.pt +3 -0
- bs1/request_001/gemm1_weights_scale.pt +3 -0
- bs1/request_001/gemm2_weights.pt +3 -0
- bs1/request_001/gemm2_weights_scale.pt +3 -0
- bs1/request_001/hidden_states.pt +3 -0
- bs1/request_001/hidden_states_scale.pt +3 -0
- bs1/request_001/routing_bias.pt +3 -0
- bs1/request_001/routing_logits.pt +3 -0
- bs1/request_001/scalar.json +17 -0
- bs16/request_001/gemm1_weights.pt +3 -0
- bs16/request_001/gemm1_weights_scale.pt +3 -0
- bs16/request_001/gemm2_weights.pt +3 -0
- bs16/request_001/gemm2_weights_scale.pt +3 -0
- bs16/request_001/hidden_states.pt +3 -0
- bs16/request_001/hidden_states_scale.pt +3 -0
- bs16/request_001/routing_bias.pt +3 -0
- bs16/request_001/routing_logits.pt +3 -0
- bs16/request_001/scalar.json +17 -0
bs1/request_001/gemm1_weights.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee5e75db7dff7beeecca982ce4c7ea441c28c8321ddd3474761ed1beef96bbe7
|
| 3 |
+
size 1409635545
|
bs1/request_001/gemm1_weights_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b7c7170f48b855553528c1e1764666cfe867a8e2ec310845c153e8dd2e150ba9
|
| 3 |
+
size 1409635605
|
bs1/request_001/gemm2_weights.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:953a6c64e452fc9ba80ebbd028f0b5b4bc669916a257202535da00cf053aa9f2
|
| 3 |
+
size 1409635545
|
bs1/request_001/gemm2_weights_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47d21dcaafea4a0a754145e09e06c392e875ff4ff2644b69df5d409798dd9dff
|
| 3 |
+
size 1409635605
|
bs1/request_001/hidden_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff5dcdfecb4e17ed63ca544fac0cff282638170799416461caa5f09e134e58de
|
| 3 |
+
size 109203
|
bs1/request_001/hidden_states_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b606d073dd93381419f3c0d39b475f7d99d1ebe13a372b1f71ee9cd41ad99bfc
|
| 3 |
+
size 4989
|
bs1/request_001/routing_bias.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a11aef9dba200f6f365e06af25c8d1c94025821591b12e21286443fce234e9f
|
| 3 |
+
size 2124
|
bs1/request_001/routing_logits.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5353243e196d9f0b2a2f05805268038c2a6eb9017d62690ec5b1d01f435eb307
|
| 3 |
+
size 16986
|
bs1/request_001/scalar.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"request_id": "001",
|
| 3 |
+
"timestamp": "2025-09-23T05:33:14.358360",
|
| 4 |
+
"num_experts": 256,
|
| 5 |
+
"top_k": 8,
|
| 6 |
+
"n_group": 8,
|
| 7 |
+
"topk_group": 4,
|
| 8 |
+
"intermediate_size": 256,
|
| 9 |
+
"local_expert_offset": 0,
|
| 10 |
+
"local_num_experts": 256,
|
| 11 |
+
"routed_scaling_factor": 2.5,
|
| 12 |
+
"tile_tokens_dim": 8,
|
| 13 |
+
"routing_method_type": 2,
|
| 14 |
+
"use_shuffled_weight": false,
|
| 15 |
+
"weight_layout": 0,
|
| 16 |
+
"enable_pdl": null
|
| 17 |
+
}
|
bs16/request_001/gemm1_weights.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98e23f847973e4d8d90df0fd5bbc6af5398785555e54c363ba09f9a17106c2c9
|
| 3 |
+
size 1409635545
|
bs16/request_001/gemm1_weights_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cad9d9790ff7ab42646f53e2bd091556b3e0970abd80c50553953398c4aa964e
|
| 3 |
+
size 1409635605
|
bs16/request_001/gemm2_weights.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e93148ef152ca02cd710d13649411dc09b72e2fa25cf05f9f95defd703971542
|
| 3 |
+
size 1409635545
|
bs16/request_001/gemm2_weights_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1d7f9efd62c35aa6ef9f952a0ca351c3be48fec7eb366dbacd27af74527092d
|
| 3 |
+
size 1409635605
|
bs16/request_001/hidden_states.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbc34a294f5a4106d44f8c5963a2ae0e7344effb6a560f861ace4b389b9304aa
|
| 3 |
+
size 4524691
|
bs16/request_001/hidden_states_scale.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:402bcf6b5db460e1f14be6a0f5436204d2b942b0ba704078e1ef25351a25e40d
|
| 3 |
+
size 142973
|
bs16/request_001/routing_bias.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d925815d772b3a942e760ea8a63a857dc5db5b39c2c36d8101b60ac5df39db4e
|
| 3 |
+
size 2124
|
bs16/request_001/routing_logits.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c6a0bcd39dc8dc02c878e8783ae702131b1c6958ae5bae6eda9f016a9a54516
|
| 3 |
+
size 647770
|
bs16/request_001/scalar.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"request_id": "001",
|
| 3 |
+
"timestamp": "2025-09-23T05:42:55.714241",
|
| 4 |
+
"num_experts": 256,
|
| 5 |
+
"top_k": 8,
|
| 6 |
+
"n_group": 8,
|
| 7 |
+
"topk_group": 4,
|
| 8 |
+
"intermediate_size": 256,
|
| 9 |
+
"local_expert_offset": 0,
|
| 10 |
+
"local_num_experts": 256,
|
| 11 |
+
"routed_scaling_factor": 2.5,
|
| 12 |
+
"tile_tokens_dim": 32,
|
| 13 |
+
"routing_method_type": 2,
|
| 14 |
+
"use_shuffled_weight": false,
|
| 15 |
+
"weight_layout": 0,
|
| 16 |
+
"enable_pdl": null
|
| 17 |
+
}
|