File tree Expand file tree Collapse file tree 3 files changed +79
-57
lines changed
QEfficient/diffusers/pipelines Expand file tree Collapse file tree 3 files changed +79
-57
lines changed Original file line number Diff line number Diff line change 3131 "execute" : {
3232 "device_ids" : null
3333 }
34- }
34+ },
35+ "vae_decoder" :{
36+ "specializations" : [
37+ {
38+ "batch_size" : 1 ,
39+ "num_channels" : 16
40+ }
41+ ],
42+ "compilation" :
43+ {
44+ "onnx_path" : null ,
45+ "compile_dir" : null ,
46+ "mdp_ts_num_devices" : 8 ,
47+ "mxfp6_matmul" : false ,
48+ "convert_to_fp16" : true ,
49+ "aic_num_cores" : 16 ,
50+ "aic-enable-depth-first" : true ,
51+ "compile_only" :true ,
52+ "mos" : 1 ,
53+ "mdts_mos" : 1
54+ },
55+ "execute" :
56+ {
57+ "device_ids" : null
58+ }
59+ }
3560 }
3661}
Original file line number Diff line number Diff line change @@ -760,7 +760,7 @@ def __call__(
760760 inputs = {"latent_sample" : latents .numpy ()}
761761
762762 start_decode_time = time .perf_counter ()
763- video = self .vae_decoder .qpc_session .run (inputs ) # CPU fallback
763+ video = self .vae_decoder .qpc_session .run (inputs )
764764 end_decode_time = time .perf_counter ()
765765 vae_decoder_perf = end_decode_time - start_decode_time
766766
Original file line number Diff line number Diff line change 33 "model_type" : " wan" ,
44 "modules" : {
55 "transformer" : {
6- "specializations" : [
7- {
8- "batch_size" : " 1" ,
9- "num_channels" : " 16" ,
10- "steps" : " 1" ,
11- "sequence_length" : " 512" ,
12- "model_type" : 1
13- },
14- {
15- "batch_size" : " 1" ,
16- "num_channels" : " 16" ,
17- "steps" : " 1" ,
18- "sequence_length" : " 512" ,
19- "model_type" : 2
20- }
21- ],
22- "compilation" : {
23- "onnx_path" : null ,
24- "compile_dir" : null ,
25- "mdp_ts_num_devices" : 16 ,
26- "mxfp6_matmul" : true ,
27- "convert_to_fp16" : true ,
28- "aic_num_cores" : 16 ,
29- "mos" : 1 ,
30- "mdts_mos" : 1
31- },
32- "execute" : {
33- "device_ids" : null
34- }
35- },
36- "vae_decoder" :
37- {
38- "specializations" : [
39- {
40- "batch_size" : 1 ,
41- "num_channels" : 16 ,
42- "num_frames" : 21 ,
43- "latent_height" : 60 ,
44- "latent_width" : 104
45- }
46- ],
47- "compilation" :
6+ "specializations" : [
487 {
49- "onnx_path" : null ,
50- "compile_dir" : null ,
51- "mdp_ts_num_devices" : 8 ,
52- "mxfp6_matmul" : false ,
53- "convert_to_fp16" : true ,
54- "aic_num_cores" : 16 ,
55- "aic-enable-depth-first" : true ,
56- "compile_only" :true ,
57- "mos" : 1 ,
58- "mdts_mos" : 1
8+ "batch_size" : " 1" ,
9+ "num_channels" : " 16" ,
10+ "steps" : " 1" ,
11+ "sequence_length" : " 512" ,
12+ "model_type" : 1
5913 },
60- "execute" :
6114 {
62- "device_ids" : null
15+ "batch_size" : " 1" ,
16+ "num_channels" : " 16" ,
17+ "steps" : " 1" ,
18+ "sequence_length" : " 512" ,
19+ "model_type" : 2
20+ }
21+ ],
22+ "compilation" : {
23+ "onnx_path" : null ,
24+ "compile_dir" : null ,
25+ "mdp_ts_num_devices" : 16 ,
26+ "mxfp6_matmul" : true ,
27+ "convert_to_fp16" : true ,
28+ "aic_num_cores" : 16 ,
29+ "mos" : 1 ,
30+ "mdts_mos" : 1
31+ },
32+ "execute" : {
33+ "device_ids" : null
34+ }
35+ },
36+ "vae_decoder" :
37+ {
38+ "specializations" : [
39+ {
40+ "batch_size" : 1 ,
41+ "num_channels" : 16
6342 }
64- }
43+ ],
44+ "compilation" :
45+ {
46+ "onnx_path" : null ,
47+ "compile_dir" : null ,
48+ "mdp_ts_num_devices" : 8 ,
49+ "mxfp6_matmul" : false ,
50+ "convert_to_fp16" : true ,
51+ "aic_num_cores" : 16 ,
52+ "aic-enable-depth-first" : true ,
53+ "compile_only" :true ,
54+ "mos" : 1 ,
55+ "mdts_mos" : 1
56+ },
57+ "execute" :
58+ {
59+ "device_ids" : null
60+ }
61+ }
6562
6663 }
6764}
You can’t perform that action at this time.
0 commit comments