
Commit 34f4a4b

<minor> add attn_quant for opensora, the cross_attn still buggy
1 parent cb00633

File tree: 9 files changed, +647 -62 lines changed

examples/opensora1.2/configs/config.yaml

Lines changed: 25 additions & 1 deletion
@@ -1,6 +1,7 @@
 model:
   model_id: "opensora"
   model_type: 'opensora' # ['sd','sdxl']
+  remain_fp_regex: embedder|adaLN_modulation|t_block
 calib_data:
 weight:
   n_bits: 8
@@ -10,5 +11,28 @@ act:
   n_bits: 8
   group: 'token' # DIRTY: it is not used, forced as "token-wise"
   sym: True
-remain_fp_regex: embedder|adaLN_modulation|t_block
+attn:
+  qk:
+    n_bits: 8
+    reorder_file_path:
+  v:
+    n_bits: 8
+  attn_map: # V*attn_map_post_softmax quantized
+    n_bits: 8
+    sym: True
+    group: 'row'
+    # level_2: True
+    # int8_scale: False
+    # mixed_precision_cfg_path: './visualization/attn_map_mixed_precision.pt'
+cross_attn:
+  q:
+    n_bits: 8
+    sym: True
+  kv:
+    n_bits: 8
+    sym: True
+  # attn_map:
+  #   n_bits: 8
+  #   sym: True
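A minimal sketch of how a `remain_fp_regex` like the one this commit moves under `model:` is typically consumed: module names matching the pattern are kept in floating point and skipped by the quantizer. The helper and module names below are hypothetical illustrations, not the repository's actual code.

```python
import re

# Pattern from the config above; matching modules stay in floating point.
REMAIN_FP_REGEX = r"embedder|adaLN_modulation|t_block"

def keeps_fp(module_name: str, pattern: str = REMAIN_FP_REGEX) -> bool:
    """Return True if the named module should be left unquantized."""
    return re.search(pattern, module_name) is not None

# Hypothetical module names, for illustration only.
module_names = [
    "blocks.0.attn.qkv",
    "x_embedder.proj",
    "blocks.0.adaLN_modulation.1",
    "t_block.linear",
]
quantized = [m for m in module_names if not keeps_fp(m)]
```

With this filter, only `blocks.0.attn.qkv` would be quantized; the embedder, adaLN modulation, and t_block layers remain in full precision.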

examples/opensora1.2/configs/sample.py

Lines changed: 3 additions & 3 deletions
@@ -5,8 +5,8 @@
 frame_interval = 1
 save_fps = 24
 ptq_config='./configs/config.yaml'
-save_dir = "./logs/int8_linear"
-seed = 1024
+save_dir = "./logs/attn_int8_naive"
+seed = 114514
 batch_size = 1
 multi_resolution = "STDiT2"
 dtype = "bf16"
@@ -18,7 +18,7 @@
     # from_pretrained="/share/public/zhuhongyu/hpcai-tech/OpenSora-STDiT-v3",
     from_pretrained="/home/zhaotianchen/models/hpcai-tech/OpenSora-STDiT-v3",
     qk_norm=True,
-    enable_flash_attn=True,
+    enable_flash_attn=False,
     enable_layernorm_kernel=False, # didnot install apex
 )
 vae = dict(
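The new `attn_map` config (`n_bits: 8`, `sym: True`, `group: 'row'`) describes symmetric 8-bit fake quantization applied per row of the post-softmax attention map. A minimal sketch of that scheme, assuming one shared scale per row; this is an illustration, not the repository's implementation:

```python
def fake_quant_row(row, n_bits=8):
    """Symmetric per-row fake quantization: quantize to int, then dequantize.

    One scale is computed per row (group: 'row'); values are rounded to the
    nearest of 2**n_bits symmetric levels and mapped back to float.
    """
    qmax = 2 ** (n_bits - 1) - 1           # 127 for int8
    scale = max(abs(v) for v in row) / qmax or 1.0  # avoid div-by-zero rows
    return [round(v / scale) * scale for v in row]

attn_row = [0.70, 0.20, 0.08, 0.02]        # post-softmax attention weights
deq = fake_quant_row(attn_row)
err = max(abs(a - b) for a, b in zip(attn_row, deq))
```

The worst-case error is bounded by half the row's scale (about `max(|row|) / 254` for int8), which is why a per-row group keeps small attention weights from being crushed by one large entry elsewhere in the tensor.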

0 commit comments
