Yong Wu committed on
Commit
d5ff5a1
·
1 Parent(s): 98e2462

inputs from SGL serving

Browse files
bs1/request_001/gemm1_weights.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee5e75db7dff7beeecca982ce4c7ea441c28c8321ddd3474761ed1beef96bbe7
3
+ size 1409635545
bs1/request_001/gemm1_weights_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7c7170f48b855553528c1e1764666cfe867a8e2ec310845c153e8dd2e150ba9
3
+ size 1409635605
bs1/request_001/gemm2_weights.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:953a6c64e452fc9ba80ebbd028f0b5b4bc669916a257202535da00cf053aa9f2
3
+ size 1409635545
bs1/request_001/gemm2_weights_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47d21dcaafea4a0a754145e09e06c392e875ff4ff2644b69df5d409798dd9dff
3
+ size 1409635605
bs1/request_001/hidden_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff5dcdfecb4e17ed63ca544fac0cff282638170799416461caa5f09e134e58de
3
+ size 109203
bs1/request_001/hidden_states_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b606d073dd93381419f3c0d39b475f7d99d1ebe13a372b1f71ee9cd41ad99bfc
3
+ size 4989
bs1/request_001/routing_bias.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a11aef9dba200f6f365e06af25c8d1c94025821591b12e21286443fce234e9f
3
+ size 2124
bs1/request_001/routing_logits.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5353243e196d9f0b2a2f05805268038c2a6eb9017d62690ec5b1d01f435eb307
3
+ size 16986
bs1/request_001/scalar.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "request_id": "001",
3
+ "timestamp": "2025-09-23T05:33:14.358360",
4
+ "num_experts": 256,
5
+ "top_k": 8,
6
+ "n_group": 8,
7
+ "topk_group": 4,
8
+ "intermediate_size": 256,
9
+ "local_expert_offset": 0,
10
+ "local_num_experts": 256,
11
+ "routed_scaling_factor": 2.5,
12
+ "tile_tokens_dim": 8,
13
+ "routing_method_type": 2,
14
+ "use_shuffled_weight": false,
15
+ "weight_layout": 0,
16
+ "enable_pdl": null
17
+ }
bs16/request_001/gemm1_weights.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98e23f847973e4d8d90df0fd5bbc6af5398785555e54c363ba09f9a17106c2c9
3
+ size 1409635545
bs16/request_001/gemm1_weights_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cad9d9790ff7ab42646f53e2bd091556b3e0970abd80c50553953398c4aa964e
3
+ size 1409635605
bs16/request_001/gemm2_weights.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e93148ef152ca02cd710d13649411dc09b72e2fa25cf05f9f95defd703971542
3
+ size 1409635545
bs16/request_001/gemm2_weights_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1d7f9efd62c35aa6ef9f952a0ca351c3be48fec7eb366dbacd27af74527092d
3
+ size 1409635605
bs16/request_001/hidden_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbc34a294f5a4106d44f8c5963a2ae0e7344effb6a560f861ace4b389b9304aa
3
+ size 4524691
bs16/request_001/hidden_states_scale.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:402bcf6b5db460e1f14be6a0f5436204d2b942b0ba704078e1ef25351a25e40d
3
+ size 142973
bs16/request_001/routing_bias.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d925815d772b3a942e760ea8a63a857dc5db5b39c2c36d8101b60ac5df39db4e
3
+ size 2124
bs16/request_001/routing_logits.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c6a0bcd39dc8dc02c878e8783ae702131b1c6958ae5bae6eda9f016a9a54516
3
+ size 647770
bs16/request_001/scalar.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "request_id": "001",
3
+ "timestamp": "2025-09-23T05:42:55.714241",
4
+ "num_experts": 256,
5
+ "top_k": 8,
6
+ "n_group": 8,
7
+ "topk_group": 4,
8
+ "intermediate_size": 256,
9
+ "local_expert_offset": 0,
10
+ "local_num_experts": 256,
11
+ "routed_scaling_factor": 2.5,
12
+ "tile_tokens_dim": 32,
13
+ "routing_method_type": 2,
14
+ "use_shuffled_weight": false,
15
+ "weight_layout": 0,
16
+ "enable_pdl": null
17
+ }