# nvfp4-fast.yaml -- uploaded by lym00 (commit 53edc18, verified), 746 bytes.
# Quantization settings: 4-bit float weights and inputs, plus a separate
# 4-bit integer scheme for an extra set of weights.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been stripped -- confirm against the consumer's schema.
quant:
  # Smoothing search for projection layers; 10 grid points.
  smooth:
    proj:
      num_grids: 10

  # Calibration data: 32 samples read from the cache directory below.
  # The trailing "s32" path component matches num_samples.
  calib:
    num_samples: 32
    path: datasets/torch.bfloat16/flux.1-kontext-dev/fmeuler8-g1/qdiff/s32

  # Weights: two scale levels, one group shape per scale dtype.
  # NOTE(review): presumably level 1 ([-1, -1], scale dtype null) is a
  # whole-tensor scale and level 2 is an FP8 scale per 16-element group
  # -- confirm against the quantizer documentation.
  wgts:
    dtype: sfp4_e2m1_all
    group_shapes:
      - - -1
        - -1
      - - 1
        - 16
        - 1
        - 1
        - 1
    scale_dtypes:
      - null
      - sfp8_e4m3_nan

  # Inputs: non-static quantization with a single scale level.
  # NOTE(review): "static: false" presumably means scales are computed at
  # run time rather than calibrated offline -- confirm.
  ipts:
    static: false
    dtype: sfp4_e2m1_all
    group_shapes:
      - - 1
        - 16
        - 1
        - 1
        - 1
    scale_dtypes:
      - sfp8_e4m3_nan

  # Switch for the extra_wgts section that follows.
  enable_extra_wgts: true

  # Extra weights: signed 4-bit integers in groups of 64, listing the
  # two module keys under "includes".
  # NOTE(review): presumably "includes" restricts this scheme to the named
  # module groups -- verify against the consumer.
  extra_wgts:
    dtype: sint4
    group_shapes:
      - - 1
        - 64
        - 1
        - 1
        - 1
    scale_dtypes:
      - null
    includes:
      - transformer_norm
      - transformer_add_norm