BOAST 1.3.4 → 1.3.5

Sign up to get free protection for your applications and to get access to all the features.
@@ -1,5 +1,5 @@
1
1
  module BOAST
2
- X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
2
+ X86CPUID_by_name = {"_m_from_int64"=>["MMX"],
3
3
  "_m_to_int64"=>["MMX"],
4
4
  "_m_empty"=>["MMX"],
5
5
  "_m_from_int"=>["MMX"],
@@ -134,7 +134,7 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
134
134
  "_MM_SET_ROUNDING_MODE"=>["SSE"],
135
135
  "_MM_GET_FLUSH_ZERO_MODE"=>["SSE"],
136
136
  "_MM_SET_FLUSH_ZERO_MODE"=>["SSE"],
137
- "_mm_prefetch"=>["PREFETCHWT1"],
137
+ "_mm_prefetch"=>["PREFETCHW"],
138
138
  "_mm_sfence"=>["SSE"],
139
139
  "_mm_max_pi16"=>["SSE"],
140
140
  "_m_pmaxsw"=>["SSE"],
@@ -1338,8 +1338,8 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
1338
1338
  "_xrstor64"=>["XSAVE"],
1339
1339
  "_xsave"=>["XSAVE"],
1340
1340
  "_xsave64"=>["XSAVE"],
1341
- "_xsaveopt"=>["XSAVE", "XSAVEOPT"],
1342
- "_xsaveopt64"=>["XSAVE", "XSAVEOPT"],
1341
+ "_xsaveopt"=>[["XSAVE", "XSAVEOPT"]],
1342
+ "_xsaveopt64"=>[["XSAVE", "XSAVEOPT"]],
1343
1343
  "_xsetbv"=>["XSAVE"],
1344
1344
  "_mm_loadu_si32"=>nil,
1345
1345
  "_mm_storeu_si32"=>nil,
@@ -1392,12 +1392,12 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
1392
1392
  "_storebe_i16"=>nil,
1393
1393
  "_storebe_i32"=>nil,
1394
1394
  "_storebe_i64"=>nil,
1395
- "_xsavec"=>["XSAVE", "XSAVEC"],
1396
- "_xsaves"=>["XSAVE", "XSS"],
1397
- "_xsavec64"=>["XSAVE", "XSAVEC"],
1398
- "_xsaves64"=>["XSAVE", "XSS"],
1399
- "_xrstors"=>["XSAVE", "XSS"],
1400
- "_xrstors64"=>["XSAVE", "XSS"],
1395
+ "_xsavec"=>[["XSAVE", "XSAVEC"]],
1396
+ "_xsaves"=>[["XSAVE", "XSS"]],
1397
+ "_xsavec64"=>[["XSAVE", "XSAVEC"]],
1398
+ "_xsaves64"=>[["XSAVE", "XSS"]],
1399
+ "_xrstors"=>[["XSAVE", "XSS"]],
1400
+ "_xrstors64"=>[["XSAVE", "XSS"]],
1401
1401
  "_mm512_kandn"=>["KNCNI"],
1402
1402
  "_mm512_kand"=>["KNCNI"],
1403
1403
  "_mm512_kmov"=>["KNCNI"],
@@ -3278,8 +3278,8 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
3278
3278
  "_mm512_kswapb"=>["KNCNI"],
3279
3279
  "_mm512_kortestz"=>["AVX512F"],
3280
3280
  "_mm512_kortestc"=>["AVX512F"],
3281
- "_mm512_mask2int"=>["KNCNI"],
3282
- "_mm512_int2mask"=>["KNCNI"],
3281
+ "_mm512_mask2int"=>["AVX512F"],
3282
+ "_mm512_int2mask"=>["AVX512F"],
3283
3283
  "_mm512_kconcathi_64"=>["KNCNI"],
3284
3284
  "_mm512_kconcatlo_64"=>["KNCNI"],
3285
3285
  "_mm512_kextract_64"=>["KNCNI"],
@@ -3323,903 +3323,903 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
3323
3323
  "_mm512_kmerge2l1l"=>["KNCNI"],
3324
3324
  "_mm512_kunpackd"=>["AVX512BW"],
3325
3325
  "_mm512_kunpackw"=>["AVX512BW"],
3326
- "_mm256_mask_add_pd"=>["AVX512F", "AVX512VL"],
3327
- "_mm256_maskz_add_pd"=>["AVX512F", "AVX512VL"],
3328
- "_mm_mask_add_pd"=>["AVX512F", "AVX512VL"],
3329
- "_mm_maskz_add_pd"=>["AVX512F", "AVX512VL"],
3330
- "_mm256_mask_add_ps"=>["AVX512F", "AVX512VL"],
3331
- "_mm256_maskz_add_ps"=>["AVX512F", "AVX512VL"],
3332
- "_mm_mask_add_ps"=>["AVX512F", "AVX512VL"],
3333
- "_mm_maskz_add_ps"=>["AVX512F", "AVX512VL"],
3334
- "_mm256_alignr_epi32"=>["AVX512F", "AVX512VL"],
3335
- "_mm256_mask_alignr_epi32"=>["AVX512F", "AVX512VL"],
3336
- "_mm256_maskz_alignr_epi32"=>["AVX512F", "AVX512VL"],
3337
- "_mm_alignr_epi32"=>["AVX512F", "AVX512VL"],
3338
- "_mm_mask_alignr_epi32"=>["AVX512F", "AVX512VL"],
3339
- "_mm_maskz_alignr_epi32"=>["AVX512F", "AVX512VL"],
3340
- "_mm256_alignr_epi64"=>["AVX512F", "AVX512VL"],
3341
- "_mm256_mask_alignr_epi64"=>["AVX512F", "AVX512VL"],
3342
- "_mm256_maskz_alignr_epi64"=>["AVX512F", "AVX512VL"],
3343
- "_mm_alignr_epi64"=>["AVX512F", "AVX512VL"],
3344
- "_mm_mask_alignr_epi64"=>["AVX512F", "AVX512VL"],
3345
- "_mm_maskz_alignr_epi64"=>["AVX512F", "AVX512VL"],
3346
- "_mm256_mask_andnot_pd"=>["AVX512VL", "AVX512DQ"],
3347
- "_mm256_maskz_andnot_pd"=>["AVX512VL", "AVX512DQ"],
3326
+ "_mm256_mask_add_pd"=>[["AVX512F", "AVX512VL"]],
3327
+ "_mm256_maskz_add_pd"=>[["AVX512F", "AVX512VL"]],
3328
+ "_mm_mask_add_pd"=>[["AVX512F", "AVX512VL"]],
3329
+ "_mm_maskz_add_pd"=>[["AVX512F", "AVX512VL"]],
3330
+ "_mm256_mask_add_ps"=>[["AVX512F", "AVX512VL"]],
3331
+ "_mm256_maskz_add_ps"=>[["AVX512F", "AVX512VL"]],
3332
+ "_mm_mask_add_ps"=>[["AVX512F", "AVX512VL"]],
3333
+ "_mm_maskz_add_ps"=>[["AVX512F", "AVX512VL"]],
3334
+ "_mm256_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3335
+ "_mm256_mask_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3336
+ "_mm256_maskz_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3337
+ "_mm_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3338
+ "_mm_mask_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3339
+ "_mm_maskz_alignr_epi32"=>[["AVX512F", "AVX512VL"]],
3340
+ "_mm256_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3341
+ "_mm256_mask_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3342
+ "_mm256_maskz_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3343
+ "_mm_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3344
+ "_mm_mask_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3345
+ "_mm_maskz_alignr_epi64"=>[["AVX512F", "AVX512VL"]],
3346
+ "_mm256_mask_andnot_pd"=>[["AVX512VL", "AVX512DQ"]],
3347
+ "_mm256_maskz_andnot_pd"=>[["AVX512VL", "AVX512DQ"]],
3348
3348
  "_mm512_andnot_pd"=>["AVX512DQ"],
3349
3349
  "_mm512_mask_andnot_pd"=>["AVX512DQ"],
3350
3350
  "_mm512_maskz_andnot_pd"=>["AVX512DQ"],
3351
- "_mm_mask_andnot_pd"=>["AVX512VL", "AVX512DQ"],
3352
- "_mm_maskz_andnot_pd"=>["AVX512VL", "AVX512DQ"],
3353
- "_mm256_mask_andnot_ps"=>["AVX512VL", "AVX512DQ"],
3354
- "_mm256_maskz_andnot_ps"=>["AVX512VL", "AVX512DQ"],
3351
+ "_mm_mask_andnot_pd"=>[["AVX512VL", "AVX512DQ"]],
3352
+ "_mm_maskz_andnot_pd"=>[["AVX512VL", "AVX512DQ"]],
3353
+ "_mm256_mask_andnot_ps"=>[["AVX512VL", "AVX512DQ"]],
3354
+ "_mm256_maskz_andnot_ps"=>[["AVX512VL", "AVX512DQ"]],
3355
3355
  "_mm512_andnot_ps"=>["AVX512DQ"],
3356
3356
  "_mm512_mask_andnot_ps"=>["AVX512DQ"],
3357
3357
  "_mm512_maskz_andnot_ps"=>["AVX512DQ"],
3358
- "_mm_mask_andnot_ps"=>["AVX512VL", "AVX512DQ"],
3359
- "_mm_maskz_andnot_ps"=>["AVX512VL", "AVX512DQ"],
3360
- "_mm256_mask_and_pd"=>["AVX512VL", "AVX512DQ"],
3361
- "_mm256_maskz_and_pd"=>["AVX512VL", "AVX512DQ"],
3358
+ "_mm_mask_andnot_ps"=>[["AVX512VL", "AVX512DQ"]],
3359
+ "_mm_maskz_andnot_ps"=>[["AVX512VL", "AVX512DQ"]],
3360
+ "_mm256_mask_and_pd"=>[["AVX512VL", "AVX512DQ"]],
3361
+ "_mm256_maskz_and_pd"=>[["AVX512VL", "AVX512DQ"]],
3362
3362
  "_mm512_and_pd"=>["AVX512DQ"],
3363
3363
  "_mm512_mask_and_pd"=>["AVX512DQ"],
3364
3364
  "_mm512_maskz_and_pd"=>["AVX512DQ"],
3365
- "_mm_mask_and_pd"=>["AVX512VL", "AVX512DQ"],
3366
- "_mm_maskz_and_pd"=>["AVX512VL", "AVX512DQ"],
3367
- "_mm256_mask_and_ps"=>["AVX512VL", "AVX512DQ"],
3368
- "_mm256_maskz_and_ps"=>["AVX512VL", "AVX512DQ"],
3365
+ "_mm_mask_and_pd"=>[["AVX512VL", "AVX512DQ"]],
3366
+ "_mm_maskz_and_pd"=>[["AVX512VL", "AVX512DQ"]],
3367
+ "_mm256_mask_and_ps"=>[["AVX512VL", "AVX512DQ"]],
3368
+ "_mm256_maskz_and_ps"=>[["AVX512VL", "AVX512DQ"]],
3369
3369
  "_mm512_and_ps"=>["AVX512DQ"],
3370
3370
  "_mm512_mask_and_ps"=>["AVX512DQ"],
3371
3371
  "_mm512_maskz_and_ps"=>["AVX512DQ"],
3372
- "_mm_mask_and_ps"=>["AVX512VL", "AVX512DQ"],
3373
- "_mm_maskz_and_ps"=>["AVX512VL", "AVX512DQ"],
3374
- "_mm256_mask_blend_pd"=>["AVX512VL", "AVX512F"],
3375
- "_mm_mask_blend_pd"=>["AVX512VL", "AVX512F"],
3376
- "_mm256_mask_blend_ps"=>["AVX512VL", "AVX512F"],
3377
- "_mm_mask_blend_ps"=>["AVX512VL", "AVX512F"],
3378
- "_mm256_broadcast_f32x2"=>["AVX512VL", "AVX512DQ"],
3379
- "_mm256_mask_broadcast_f32x2"=>["AVX512VL", "AVX512DQ"],
3380
- "_mm256_maskz_broadcast_f32x2"=>["AVX512VL", "AVX512DQ"],
3372
+ "_mm_mask_and_ps"=>[["AVX512VL", "AVX512DQ"]],
3373
+ "_mm_maskz_and_ps"=>[["AVX512VL", "AVX512DQ"]],
3374
+ "_mm256_mask_blend_pd"=>[["AVX512VL", "AVX512F"]],
3375
+ "_mm_mask_blend_pd"=>[["AVX512VL", "AVX512F"]],
3376
+ "_mm256_mask_blend_ps"=>[["AVX512VL", "AVX512F"]],
3377
+ "_mm_mask_blend_ps"=>[["AVX512VL", "AVX512F"]],
3378
+ "_mm256_broadcast_f32x2"=>[["AVX512VL", "AVX512DQ"]],
3379
+ "_mm256_mask_broadcast_f32x2"=>[["AVX512VL", "AVX512DQ"]],
3380
+ "_mm256_maskz_broadcast_f32x2"=>[["AVX512VL", "AVX512DQ"]],
3381
3381
  "_mm512_broadcast_f32x2"=>["AVX512DQ"],
3382
3382
  "_mm512_mask_broadcast_f32x2"=>["AVX512DQ"],
3383
3383
  "_mm512_maskz_broadcast_f32x2"=>["AVX512DQ"],
3384
- "_mm256_broadcast_f32x4"=>["AVX512VL", "AVX512F"],
3385
- "_mm256_mask_broadcast_f32x4"=>["AVX512VL", "AVX512F"],
3386
- "_mm256_maskz_broadcast_f32x4"=>["AVX512VL", "AVX512F"],
3384
+ "_mm256_broadcast_f32x4"=>[["AVX512VL", "AVX512F"]],
3385
+ "_mm256_mask_broadcast_f32x4"=>[["AVX512VL", "AVX512F"]],
3386
+ "_mm256_maskz_broadcast_f32x4"=>[["AVX512VL", "AVX512F"]],
3387
3387
  "_mm512_broadcast_f32x8"=>["AVX512DQ"],
3388
3388
  "_mm512_mask_broadcast_f32x8"=>["AVX512DQ"],
3389
3389
  "_mm512_maskz_broadcast_f32x8"=>["AVX512DQ"],
3390
- "_mm256_broadcast_f64x2"=>["AVX512VL", "AVX512DQ"],
3391
- "_mm256_mask_broadcast_f64x2"=>["AVX512VL", "AVX512DQ"],
3392
- "_mm256_maskz_broadcast_f64x2"=>["AVX512VL", "AVX512DQ"],
3390
+ "_mm256_broadcast_f64x2"=>[["AVX512VL", "AVX512DQ"]],
3391
+ "_mm256_mask_broadcast_f64x2"=>[["AVX512VL", "AVX512DQ"]],
3392
+ "_mm256_maskz_broadcast_f64x2"=>[["AVX512VL", "AVX512DQ"]],
3393
3393
  "_mm512_broadcast_f64x2"=>["AVX512DQ"],
3394
3394
  "_mm512_mask_broadcast_f64x2"=>["AVX512DQ"],
3395
3395
  "_mm512_maskz_broadcast_f64x2"=>["AVX512DQ"],
3396
- "_mm256_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3397
- "_mm256_mask_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3398
- "_mm256_maskz_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3396
+ "_mm256_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3397
+ "_mm256_mask_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3398
+ "_mm256_maskz_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3399
3399
  "_mm512_broadcast_i32x2"=>["AVX512DQ"],
3400
3400
  "_mm512_mask_broadcast_i32x2"=>["AVX512DQ"],
3401
3401
  "_mm512_maskz_broadcast_i32x2"=>["AVX512DQ"],
3402
- "_mm_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3403
- "_mm_mask_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3404
- "_mm_maskz_broadcast_i32x2"=>["AVX512VL", "AVX512DQ"],
3405
- "_mm256_broadcast_i32x4"=>["AVX512VL", "AVX512F"],
3406
- "_mm256_mask_broadcast_i32x4"=>["AVX512VL", "AVX512F"],
3407
- "_mm256_maskz_broadcast_i32x4"=>["AVX512VL", "AVX512F"],
3402
+ "_mm_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3403
+ "_mm_mask_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3404
+ "_mm_maskz_broadcast_i32x2"=>[["AVX512VL", "AVX512DQ"]],
3405
+ "_mm256_broadcast_i32x4"=>[["AVX512VL", "AVX512F"]],
3406
+ "_mm256_mask_broadcast_i32x4"=>[["AVX512VL", "AVX512F"]],
3407
+ "_mm256_maskz_broadcast_i32x4"=>[["AVX512VL", "AVX512F"]],
3408
3408
  "_mm512_broadcast_i32x8"=>["AVX512DQ"],
3409
3409
  "_mm512_mask_broadcast_i32x8"=>["AVX512DQ"],
3410
3410
  "_mm512_maskz_broadcast_i32x8"=>["AVX512DQ"],
3411
- "_mm256_broadcast_i64x2"=>["AVX512VL", "AVX512DQ"],
3412
- "_mm256_mask_broadcast_i64x2"=>["AVX512VL", "AVX512DQ"],
3413
- "_mm256_maskz_broadcast_i64x2"=>["AVX512VL", "AVX512DQ"],
3411
+ "_mm256_broadcast_i64x2"=>[["AVX512VL", "AVX512DQ"]],
3412
+ "_mm256_mask_broadcast_i64x2"=>[["AVX512VL", "AVX512DQ"]],
3413
+ "_mm256_maskz_broadcast_i64x2"=>[["AVX512VL", "AVX512DQ"]],
3414
3414
  "_mm512_broadcast_i64x2"=>["AVX512DQ"],
3415
3415
  "_mm512_mask_broadcast_i64x2"=>["AVX512DQ"],
3416
3416
  "_mm512_maskz_broadcast_i64x2"=>["AVX512DQ"],
3417
- "_mm256_mask_broadcastsd_pd"=>["AVX512VL", "AVX512F"],
3418
- "_mm256_maskz_broadcastsd_pd"=>["AVX512VL", "AVX512F"],
3419
- "_mm256_mask_broadcastss_ps"=>["AVX512VL", "AVX512F"],
3420
- "_mm256_maskz_broadcastss_ps"=>["AVX512VL", "AVX512F"],
3421
- "_mm_mask_broadcastss_ps"=>["AVX512VL", "AVX512F"],
3422
- "_mm_maskz_broadcastss_ps"=>["AVX512VL", "AVX512F"],
3423
- "_mm256_cmp_pd_mask"=>["AVX512VL", "AVX512F"],
3424
- "_mm256_mask_cmp_pd_mask"=>["AVX512VL", "AVX512F"],
3425
- "_mm_cmp_pd_mask"=>["AVX512VL", "AVX512F"],
3426
- "_mm_mask_cmp_pd_mask"=>["AVX512VL", "AVX512F"],
3427
- "_mm256_cmp_ps_mask"=>["AVX512VL", "AVX512F"],
3428
- "_mm256_mask_cmp_ps_mask"=>["AVX512VL", "AVX512F"],
3429
- "_mm_cmp_ps_mask"=>["AVX512VL", "AVX512F"],
3430
- "_mm_mask_cmp_ps_mask"=>["AVX512VL", "AVX512F"],
3431
- "_mm256_mask_compress_pd"=>["AVX512VL", "AVX512F"],
3432
- "_mm256_mask_compressstoreu_pd"=>["AVX512VL", "AVX512F"],
3433
- "_mm256_maskz_compress_pd"=>["AVX512VL", "AVX512F"],
3434
- "_mm_mask_compress_pd"=>["AVX512VL", "AVX512F"],
3435
- "_mm_mask_compressstoreu_pd"=>["AVX512VL", "AVX512F"],
3436
- "_mm_maskz_compress_pd"=>["AVX512VL", "AVX512F"],
3437
- "_mm256_mask_compress_ps"=>["AVX512VL", "AVX512F"],
3438
- "_mm256_mask_compressstoreu_ps"=>["AVX512VL", "AVX512F"],
3439
- "_mm256_maskz_compress_ps"=>["AVX512VL", "AVX512F"],
3440
- "_mm_mask_compress_ps"=>["AVX512VL", "AVX512F"],
3441
- "_mm_mask_compressstoreu_ps"=>["AVX512VL", "AVX512F"],
3442
- "_mm_maskz_compress_ps"=>["AVX512VL", "AVX512F"],
3443
- "_mm256_mask_cvtepi32_pd"=>["AVX512VL", "AVX512F"],
3444
- "_mm256_maskz_cvtepi32_pd"=>["AVX512VL", "AVX512F"],
3445
- "_mm_mask_cvtepi32_pd"=>["AVX512VL", "AVX512F"],
3446
- "_mm_maskz_cvtepi32_pd"=>["AVX512VL", "AVX512F"],
3447
- "_mm256_mask_cvtepi32_ps"=>["AVX512VL", "AVX512F"],
3448
- "_mm256_maskz_cvtepi32_ps"=>["AVX512VL", "AVX512F"],
3449
- "_mm_mask_cvtepi32_ps"=>["AVX512VL", "AVX512F"],
3450
- "_mm_maskz_cvtepi32_ps"=>["AVX512VL", "AVX512F"],
3451
- "_mm256_mask_cvtpd_epi32"=>["AVX512VL", "AVX512F"],
3452
- "_mm256_maskz_cvtpd_epi32"=>["AVX512VL", "AVX512F"],
3453
- "_mm_mask_cvtpd_epi32"=>["AVX512VL", "AVX512F"],
3454
- "_mm_maskz_cvtpd_epi32"=>["AVX512VL", "AVX512F"],
3455
- "_mm256_mask_cvtpd_ps"=>["AVX512VL", "AVX512F"],
3456
- "_mm256_maskz_cvtpd_ps"=>["AVX512VL", "AVX512F"],
3457
- "_mm_mask_cvtpd_ps"=>["AVX512VL", "AVX512F"],
3458
- "_mm_maskz_cvtpd_ps"=>["AVX512VL", "AVX512F"],
3459
- "_mm256_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3460
- "_mm256_mask_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3461
- "_mm256_maskz_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3417
+ "_mm256_mask_broadcastsd_pd"=>[["AVX512VL", "AVX512F"]],
3418
+ "_mm256_maskz_broadcastsd_pd"=>[["AVX512VL", "AVX512F"]],
3419
+ "_mm256_mask_broadcastss_ps"=>[["AVX512VL", "AVX512F"]],
3420
+ "_mm256_maskz_broadcastss_ps"=>[["AVX512VL", "AVX512F"]],
3421
+ "_mm_mask_broadcastss_ps"=>[["AVX512VL", "AVX512F"]],
3422
+ "_mm_maskz_broadcastss_ps"=>[["AVX512VL", "AVX512F"]],
3423
+ "_mm256_cmp_pd_mask"=>[["AVX512VL", "AVX512F"]],
3424
+ "_mm256_mask_cmp_pd_mask"=>[["AVX512VL", "AVX512F"]],
3425
+ "_mm_cmp_pd_mask"=>[["AVX512VL", "AVX512F"]],
3426
+ "_mm_mask_cmp_pd_mask"=>[["AVX512VL", "AVX512F"]],
3427
+ "_mm256_cmp_ps_mask"=>[["AVX512VL", "AVX512F"]],
3428
+ "_mm256_mask_cmp_ps_mask"=>[["AVX512VL", "AVX512F"]],
3429
+ "_mm_cmp_ps_mask"=>[["AVX512VL", "AVX512F"]],
3430
+ "_mm_mask_cmp_ps_mask"=>[["AVX512VL", "AVX512F"]],
3431
+ "_mm256_mask_compress_pd"=>[["AVX512VL", "AVX512F"]],
3432
+ "_mm256_mask_compressstoreu_pd"=>[["AVX512VL", "AVX512F"]],
3433
+ "_mm256_maskz_compress_pd"=>[["AVX512VL", "AVX512F"]],
3434
+ "_mm_mask_compress_pd"=>[["AVX512VL", "AVX512F"]],
3435
+ "_mm_mask_compressstoreu_pd"=>[["AVX512VL", "AVX512F"]],
3436
+ "_mm_maskz_compress_pd"=>[["AVX512VL", "AVX512F"]],
3437
+ "_mm256_mask_compress_ps"=>[["AVX512VL", "AVX512F"]],
3438
+ "_mm256_mask_compressstoreu_ps"=>[["AVX512VL", "AVX512F"]],
3439
+ "_mm256_maskz_compress_ps"=>[["AVX512VL", "AVX512F"]],
3440
+ "_mm_mask_compress_ps"=>[["AVX512VL", "AVX512F"]],
3441
+ "_mm_mask_compressstoreu_ps"=>[["AVX512VL", "AVX512F"]],
3442
+ "_mm_maskz_compress_ps"=>[["AVX512VL", "AVX512F"]],
3443
+ "_mm256_mask_cvtepi32_pd"=>[["AVX512VL", "AVX512F"]],
3444
+ "_mm256_maskz_cvtepi32_pd"=>[["AVX512VL", "AVX512F"]],
3445
+ "_mm_mask_cvtepi32_pd"=>[["AVX512VL", "AVX512F"]],
3446
+ "_mm_maskz_cvtepi32_pd"=>[["AVX512VL", "AVX512F"]],
3447
+ "_mm256_mask_cvtepi32_ps"=>[["AVX512VL", "AVX512F"]],
3448
+ "_mm256_maskz_cvtepi32_ps"=>[["AVX512VL", "AVX512F"]],
3449
+ "_mm_mask_cvtepi32_ps"=>[["AVX512VL", "AVX512F"]],
3450
+ "_mm_maskz_cvtepi32_ps"=>[["AVX512VL", "AVX512F"]],
3451
+ "_mm256_mask_cvtpd_epi32"=>[["AVX512VL", "AVX512F"]],
3452
+ "_mm256_maskz_cvtpd_epi32"=>[["AVX512VL", "AVX512F"]],
3453
+ "_mm_mask_cvtpd_epi32"=>[["AVX512VL", "AVX512F"]],
3454
+ "_mm_maskz_cvtpd_epi32"=>[["AVX512VL", "AVX512F"]],
3455
+ "_mm256_mask_cvtpd_ps"=>[["AVX512VL", "AVX512F"]],
3456
+ "_mm256_maskz_cvtpd_ps"=>[["AVX512VL", "AVX512F"]],
3457
+ "_mm_mask_cvtpd_ps"=>[["AVX512VL", "AVX512F"]],
3458
+ "_mm_maskz_cvtpd_ps"=>[["AVX512VL", "AVX512F"]],
3459
+ "_mm256_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3460
+ "_mm256_mask_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3461
+ "_mm256_maskz_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3462
3462
  "_mm512_cvt_roundpd_epi64"=>["AVX512DQ"],
3463
3463
  "_mm512_cvtpd_epi64"=>["AVX512DQ"],
3464
3464
  "_mm512_mask_cvt_roundpd_epi64"=>["AVX512DQ"],
3465
3465
  "_mm512_mask_cvtpd_epi64"=>["AVX512DQ"],
3466
3466
  "_mm512_maskz_cvt_roundpd_epi64"=>["AVX512DQ"],
3467
3467
  "_mm512_maskz_cvtpd_epi64"=>["AVX512DQ"],
3468
- "_mm_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3469
- "_mm_mask_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3470
- "_mm_maskz_cvtpd_epi64"=>["AVX512VL", "AVX512DQ"],
3471
- "_mm256_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3472
- "_mm256_mask_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3473
- "_mm256_maskz_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3474
- "_mm_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3475
- "_mm_mask_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3476
- "_mm_maskz_cvtpd_epu32"=>["AVX512VL", "AVX512F"],
3477
- "_mm256_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3478
- "_mm256_mask_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3479
- "_mm256_maskz_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3468
+ "_mm_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3469
+ "_mm_mask_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3470
+ "_mm_maskz_cvtpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3471
+ "_mm256_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3472
+ "_mm256_mask_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3473
+ "_mm256_maskz_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3474
+ "_mm_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3475
+ "_mm_mask_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3476
+ "_mm_maskz_cvtpd_epu32"=>[["AVX512VL", "AVX512F"]],
3477
+ "_mm256_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3478
+ "_mm256_mask_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3479
+ "_mm256_maskz_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3480
3480
  "_mm512_cvt_roundpd_epu64"=>["AVX512DQ"],
3481
3481
  "_mm512_cvtpd_epu64"=>["AVX512DQ"],
3482
3482
  "_mm512_mask_cvt_roundpd_epu64"=>["AVX512DQ"],
3483
3483
  "_mm512_mask_cvtpd_epu64"=>["AVX512DQ"],
3484
3484
  "_mm512_maskz_cvt_roundpd_epu64"=>["AVX512DQ"],
3485
3485
  "_mm512_maskz_cvtpd_epu64"=>["AVX512DQ"],
3486
- "_mm_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3487
- "_mm_mask_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3488
- "_mm_maskz_cvtpd_epu64"=>["AVX512VL", "AVX512DQ"],
3489
- "_mm256_mask_cvtph_ps"=>["AVX512VL", "AVX512F"],
3490
- "_mm256_maskz_cvtph_ps"=>["AVX512VL", "AVX512F"],
3491
- "_mm_mask_cvtph_ps"=>["AVX512VL", "AVX512F"],
3492
- "_mm_maskz_cvtph_ps"=>["AVX512VL", "AVX512F"],
3493
- "_mm256_mask_cvtps_epi32"=>["AVX512VL", "AVX512F"],
3494
- "_mm256_maskz_cvtps_epi32"=>["AVX512VL", "AVX512F"],
3495
- "_mm_mask_cvtps_epi32"=>["AVX512VL", "AVX512F"],
3496
- "_mm_maskz_cvtps_epi32"=>["AVX512VL", "AVX512F"],
3497
- "_mm256_mask_cvt_roundps_ph"=>["AVX512VL", "AVX512F"],
3498
- "_mm256_mask_cvtps_ph"=>["AVX512VL", "AVX512F"],
3499
- "_mm256_maskz_cvt_roundps_ph"=>["AVX512VL", "AVX512F"],
3500
- "_mm256_maskz_cvtps_ph"=>["AVX512VL", "AVX512F"],
3501
- "_mm_mask_cvt_roundps_ph"=>["AVX512VL", "AVX512F"],
3502
- "_mm_mask_cvtps_ph"=>["AVX512VL", "AVX512F"],
3503
- "_mm_maskz_cvt_roundps_ph"=>["AVX512VL", "AVX512F"],
3504
- "_mm_maskz_cvtps_ph"=>["AVX512VL", "AVX512F"],
3505
- "_mm256_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3506
- "_mm256_mask_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3507
- "_mm256_maskz_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3486
+ "_mm_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3487
+ "_mm_mask_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3488
+ "_mm_maskz_cvtpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3489
+ "_mm256_mask_cvtph_ps"=>[["AVX512VL", "AVX512F"]],
3490
+ "_mm256_maskz_cvtph_ps"=>[["AVX512VL", "AVX512F"]],
3491
+ "_mm_mask_cvtph_ps"=>[["AVX512VL", "AVX512F"]],
3492
+ "_mm_maskz_cvtph_ps"=>[["AVX512VL", "AVX512F"]],
3493
+ "_mm256_mask_cvtps_epi32"=>[["AVX512VL", "AVX512F"]],
3494
+ "_mm256_maskz_cvtps_epi32"=>[["AVX512VL", "AVX512F"]],
3495
+ "_mm_mask_cvtps_epi32"=>[["AVX512VL", "AVX512F"]],
3496
+ "_mm_maskz_cvtps_epi32"=>[["AVX512VL", "AVX512F"]],
3497
+ "_mm256_mask_cvt_roundps_ph"=>[["AVX512VL", "AVX512F"]],
3498
+ "_mm256_mask_cvtps_ph"=>[["AVX512VL", "AVX512F"]],
3499
+ "_mm256_maskz_cvt_roundps_ph"=>[["AVX512VL", "AVX512F"]],
3500
+ "_mm256_maskz_cvtps_ph"=>[["AVX512VL", "AVX512F"]],
3501
+ "_mm_mask_cvt_roundps_ph"=>[["AVX512VL", "AVX512F"]],
3502
+ "_mm_mask_cvtps_ph"=>[["AVX512VL", "AVX512F"]],
3503
+ "_mm_maskz_cvt_roundps_ph"=>[["AVX512VL", "AVX512F"]],
3504
+ "_mm_maskz_cvtps_ph"=>[["AVX512VL", "AVX512F"]],
3505
+ "_mm256_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3506
+ "_mm256_mask_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3507
+ "_mm256_maskz_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3508
3508
  "_mm512_cvt_roundps_epi64"=>["AVX512DQ"],
3509
3509
  "_mm512_cvtps_epi64"=>["AVX512DQ"],
3510
3510
  "_mm512_mask_cvt_roundps_epi64"=>["AVX512DQ"],
3511
3511
  "_mm512_mask_cvtps_epi64"=>["AVX512DQ"],
3512
3512
  "_mm512_maskz_cvt_roundps_epi64"=>["AVX512DQ"],
3513
3513
  "_mm512_maskz_cvtps_epi64"=>["AVX512DQ"],
3514
- "_mm_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3515
- "_mm_mask_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3516
- "_mm_maskz_cvtps_epi64"=>["AVX512VL", "AVX512DQ"],
3517
- "_mm256_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3518
- "_mm256_mask_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3519
- "_mm256_maskz_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3520
- "_mm_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3521
- "_mm_mask_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3522
- "_mm_maskz_cvtps_epu32"=>["AVX512VL", "AVX512F"],
3523
- "_mm256_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3524
- "_mm256_mask_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3525
- "_mm256_maskz_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3514
+ "_mm_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3515
+ "_mm_mask_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3516
+ "_mm_maskz_cvtps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3517
+ "_mm256_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3518
+ "_mm256_mask_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3519
+ "_mm256_maskz_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3520
+ "_mm_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3521
+ "_mm_mask_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3522
+ "_mm_maskz_cvtps_epu32"=>[["AVX512VL", "AVX512F"]],
3523
+ "_mm256_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3524
+ "_mm256_mask_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3525
+ "_mm256_maskz_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3526
3526
  "_mm512_cvt_roundps_epu64"=>["AVX512DQ"],
3527
3527
  "_mm512_cvtps_epu64"=>["AVX512DQ"],
3528
3528
  "_mm512_mask_cvt_roundps_epu64"=>["AVX512DQ"],
3529
3529
  "_mm512_mask_cvtps_epu64"=>["AVX512DQ"],
3530
3530
  "_mm512_maskz_cvt_roundps_epu64"=>["AVX512DQ"],
3531
3531
  "_mm512_maskz_cvtps_epu64"=>["AVX512DQ"],
3532
- "_mm_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3533
- "_mm_mask_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3534
- "_mm_maskz_cvtps_epu64"=>["AVX512VL", "AVX512DQ"],
3535
- "_mm256_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3536
- "_mm256_mask_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3537
- "_mm256_maskz_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3532
+ "_mm_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3533
+ "_mm_mask_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3534
+ "_mm_maskz_cvtps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3535
+ "_mm256_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3536
+ "_mm256_mask_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3537
+ "_mm256_maskz_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3538
3538
  "_mm512_cvt_roundepi64_pd"=>["AVX512DQ"],
3539
3539
  "_mm512_cvtepi64_pd"=>["AVX512DQ"],
3540
3540
  "_mm512_mask_cvt_roundepi64_pd"=>["AVX512DQ"],
3541
3541
  "_mm512_mask_cvtepi64_pd"=>["AVX512DQ"],
3542
3542
  "_mm512_maskz_cvt_roundepi64_pd"=>["AVX512DQ"],
3543
3543
  "_mm512_maskz_cvtepi64_pd"=>["AVX512DQ"],
3544
- "_mm_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3545
- "_mm_mask_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3546
- "_mm_maskz_cvtepi64_pd"=>["AVX512VL", "AVX512DQ"],
3547
- "_mm256_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3548
- "_mm256_mask_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3549
- "_mm256_maskz_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3544
+ "_mm_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3545
+ "_mm_mask_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3546
+ "_mm_maskz_cvtepi64_pd"=>[["AVX512VL", "AVX512DQ"]],
3547
+ "_mm256_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3548
+ "_mm256_mask_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3549
+ "_mm256_maskz_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3550
3550
  "_mm512_cvt_roundepi64_ps"=>["AVX512DQ"],
3551
3551
  "_mm512_cvtepi64_ps"=>["AVX512DQ"],
3552
3552
  "_mm512_mask_cvt_roundepi64_ps"=>["AVX512DQ"],
3553
3553
  "_mm512_mask_cvtepi64_ps"=>["AVX512DQ"],
3554
3554
  "_mm512_maskz_cvt_roundepi64_ps"=>["AVX512DQ"],
3555
3555
  "_mm512_maskz_cvtepi64_ps"=>["AVX512DQ"],
3556
- "_mm_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3557
- "_mm_mask_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3558
- "_mm_maskz_cvtepi64_ps"=>["AVX512VL", "AVX512DQ"],
3559
- "_mm256_mask_cvttpd_epi32"=>["AVX512VL", "AVX512F"],
3560
- "_mm256_maskz_cvttpd_epi32"=>["AVX512VL", "AVX512F"],
3561
- "_mm_mask_cvttpd_epi32"=>["AVX512VL", "AVX512F"],
3562
- "_mm_maskz_cvttpd_epi32"=>["AVX512VL", "AVX512F"],
3563
- "_mm256_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3564
- "_mm256_mask_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3565
- "_mm256_maskz_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3556
+ "_mm_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3557
+ "_mm_mask_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3558
+ "_mm_maskz_cvtepi64_ps"=>[["AVX512VL", "AVX512DQ"]],
3559
+ "_mm256_mask_cvttpd_epi32"=>[["AVX512VL", "AVX512F"]],
3560
+ "_mm256_maskz_cvttpd_epi32"=>[["AVX512VL", "AVX512F"]],
3561
+ "_mm_mask_cvttpd_epi32"=>[["AVX512VL", "AVX512F"]],
3562
+ "_mm_maskz_cvttpd_epi32"=>[["AVX512VL", "AVX512F"]],
3563
+ "_mm256_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3564
+ "_mm256_mask_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3565
+ "_mm256_maskz_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3566
3566
  "_mm512_cvtt_roundpd_epi64"=>["AVX512DQ"],
3567
3567
  "_mm512_cvttpd_epi64"=>["AVX512DQ"],
3568
3568
  "_mm512_mask_cvtt_roundpd_epi64"=>["AVX512DQ"],
3569
3569
  "_mm512_mask_cvttpd_epi64"=>["AVX512DQ"],
3570
3570
  "_mm512_maskz_cvtt_roundpd_epi64"=>["AVX512DQ"],
3571
3571
  "_mm512_maskz_cvttpd_epi64"=>["AVX512DQ"],
3572
- "_mm_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3573
- "_mm_mask_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3574
- "_mm_maskz_cvttpd_epi64"=>["AVX512VL", "AVX512DQ"],
3575
- "_mm256_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3576
- "_mm256_mask_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3577
- "_mm256_maskz_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3578
- "_mm_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3579
- "_mm_mask_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3580
- "_mm_maskz_cvttpd_epu32"=>["AVX512VL", "AVX512F"],
3581
- "_mm256_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3582
- "_mm256_mask_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3583
- "_mm256_maskz_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3572
+ "_mm_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3573
+ "_mm_mask_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3574
+ "_mm_maskz_cvttpd_epi64"=>[["AVX512VL", "AVX512DQ"]],
3575
+ "_mm256_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3576
+ "_mm256_mask_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3577
+ "_mm256_maskz_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3578
+ "_mm_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3579
+ "_mm_mask_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3580
+ "_mm_maskz_cvttpd_epu32"=>[["AVX512VL", "AVX512F"]],
3581
+ "_mm256_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3582
+ "_mm256_mask_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3583
+ "_mm256_maskz_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3584
3584
  "_mm512_cvtt_roundpd_epu64"=>["AVX512DQ"],
3585
3585
  "_mm512_cvttpd_epu64"=>["AVX512DQ"],
3586
3586
  "_mm512_mask_cvtt_roundpd_epu64"=>["AVX512DQ"],
3587
3587
  "_mm512_mask_cvttpd_epu64"=>["AVX512DQ"],
3588
3588
  "_mm512_maskz_cvtt_roundpd_epu64"=>["AVX512DQ"],
3589
3589
  "_mm512_maskz_cvttpd_epu64"=>["AVX512DQ"],
3590
- "_mm_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3591
- "_mm_mask_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3592
- "_mm_maskz_cvttpd_epu64"=>["AVX512VL", "AVX512DQ"],
3593
- "_mm256_mask_cvttps_epi32"=>["AVX512VL", "AVX512F"],
3594
- "_mm256_maskz_cvttps_epi32"=>["AVX512VL", "AVX512F"],
3595
- "_mm_mask_cvttps_epi32"=>["AVX512VL", "AVX512F"],
3596
- "_mm_maskz_cvttps_epi32"=>["AVX512VL", "AVX512F"],
3597
- "_mm256_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3598
- "_mm256_mask_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3599
- "_mm256_maskz_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3590
+ "_mm_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3591
+ "_mm_mask_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3592
+ "_mm_maskz_cvttpd_epu64"=>[["AVX512VL", "AVX512DQ"]],
3593
+ "_mm256_mask_cvttps_epi32"=>[["AVX512VL", "AVX512F"]],
3594
+ "_mm256_maskz_cvttps_epi32"=>[["AVX512VL", "AVX512F"]],
3595
+ "_mm_mask_cvttps_epi32"=>[["AVX512VL", "AVX512F"]],
3596
+ "_mm_maskz_cvttps_epi32"=>[["AVX512VL", "AVX512F"]],
3597
+ "_mm256_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3598
+ "_mm256_mask_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3599
+ "_mm256_maskz_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3600
3600
  "_mm512_cvtt_roundps_epi64"=>["AVX512DQ"],
3601
3601
  "_mm512_cvttps_epi64"=>["AVX512DQ"],
3602
3602
  "_mm512_mask_cvtt_roundps_epi64"=>["AVX512DQ"],
3603
3603
  "_mm512_mask_cvttps_epi64"=>["AVX512DQ"],
3604
3604
  "_mm512_maskz_cvtt_roundps_epi64"=>["AVX512DQ"],
3605
3605
  "_mm512_maskz_cvttps_epi64"=>["AVX512DQ"],
3606
- "_mm_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3607
- "_mm_mask_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3608
- "_mm_maskz_cvttps_epi64"=>["AVX512VL", "AVX512DQ"],
3609
- "_mm256_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3610
- "_mm256_mask_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3611
- "_mm256_maskz_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3612
- "_mm_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3613
- "_mm_mask_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3614
- "_mm_maskz_cvttps_epu32"=>["AVX512VL", "AVX512F"],
3615
- "_mm256_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3616
- "_mm256_mask_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3617
- "_mm256_maskz_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3606
+ "_mm_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3607
+ "_mm_mask_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3608
+ "_mm_maskz_cvttps_epi64"=>[["AVX512VL", "AVX512DQ"]],
3609
+ "_mm256_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3610
+ "_mm256_mask_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3611
+ "_mm256_maskz_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3612
+ "_mm_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3613
+ "_mm_mask_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3614
+ "_mm_maskz_cvttps_epu32"=>[["AVX512VL", "AVX512F"]],
3615
+ "_mm256_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3616
+ "_mm256_mask_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3617
+ "_mm256_maskz_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3618
3618
  "_mm512_cvtt_roundps_epu64"=>["AVX512DQ"],
3619
3619
  "_mm512_cvttps_epu64"=>["AVX512DQ"],
3620
3620
  "_mm512_mask_cvtt_roundps_epu64"=>["AVX512DQ"],
3621
3621
  "_mm512_mask_cvttps_epu64"=>["AVX512DQ"],
3622
3622
  "_mm512_maskz_cvtt_roundps_epu64"=>["AVX512DQ"],
3623
3623
  "_mm512_maskz_cvttps_epu64"=>["AVX512DQ"],
3624
- "_mm_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3625
- "_mm_mask_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3626
- "_mm_maskz_cvttps_epu64"=>["AVX512VL", "AVX512DQ"],
3627
- "_mm256_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3628
- "_mm256_mask_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3629
- "_mm256_maskz_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3630
- "_mm_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3631
- "_mm_mask_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3632
- "_mm_maskz_cvtepu32_pd"=>["AVX512VL", "AVX512F"],
3633
- "_mm256_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3634
- "_mm256_mask_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3635
- "_mm256_maskz_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3624
+ "_mm_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3625
+ "_mm_mask_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3626
+ "_mm_maskz_cvttps_epu64"=>[["AVX512VL", "AVX512DQ"]],
3627
+ "_mm256_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3628
+ "_mm256_mask_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3629
+ "_mm256_maskz_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3630
+ "_mm_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3631
+ "_mm_mask_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3632
+ "_mm_maskz_cvtepu32_pd"=>[["AVX512VL", "AVX512F"]],
3633
+ "_mm256_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3634
+ "_mm256_mask_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3635
+ "_mm256_maskz_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3636
3636
  "_mm512_cvt_roundepu64_pd"=>["AVX512DQ"],
3637
3637
  "_mm512_cvtepu64_pd"=>["AVX512DQ"],
3638
3638
  "_mm512_mask_cvt_roundepu64_pd"=>["AVX512DQ"],
3639
3639
  "_mm512_mask_cvtepu64_pd"=>["AVX512DQ"],
3640
3640
  "_mm512_maskz_cvt_roundepu64_pd"=>["AVX512DQ"],
3641
3641
  "_mm512_maskz_cvtepu64_pd"=>["AVX512DQ"],
3642
- "_mm_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3643
- "_mm_mask_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3644
- "_mm_maskz_cvtepu64_pd"=>["AVX512VL", "AVX512DQ"],
3645
- "_mm256_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3646
- "_mm256_mask_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3647
- "_mm256_maskz_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3642
+ "_mm_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3643
+ "_mm_mask_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3644
+ "_mm_maskz_cvtepu64_pd"=>[["AVX512VL", "AVX512DQ"]],
3645
+ "_mm256_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3646
+ "_mm256_mask_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3647
+ "_mm256_maskz_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3648
3648
  "_mm512_cvt_roundepu64_ps"=>["AVX512DQ"],
3649
3649
  "_mm512_cvtepu64_ps"=>["AVX512DQ"],
3650
3650
  "_mm512_mask_cvt_roundepu64_ps"=>["AVX512DQ"],
3651
3651
  "_mm512_mask_cvtepu64_ps"=>["AVX512DQ"],
3652
3652
  "_mm512_maskz_cvt_roundepu64_ps"=>["AVX512DQ"],
3653
3653
  "_mm512_maskz_cvtepu64_ps"=>["AVX512DQ"],
3654
- "_mm_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3655
- "_mm_mask_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3656
- "_mm_maskz_cvtepu64_ps"=>["AVX512VL", "AVX512DQ"],
3657
- "_mm256_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3658
- "_mm256_mask_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3659
- "_mm256_maskz_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3654
+ "_mm_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3655
+ "_mm_mask_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3656
+ "_mm_maskz_cvtepu64_ps"=>[["AVX512VL", "AVX512DQ"]],
3657
+ "_mm256_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3658
+ "_mm256_mask_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3659
+ "_mm256_maskz_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3660
3660
  "_mm512_dbsad_epu8"=>["AVX512BW"],
3661
3661
  "_mm512_mask_dbsad_epu8"=>["AVX512BW"],
3662
3662
  "_mm512_maskz_dbsad_epu8"=>["AVX512BW"],
3663
- "_mm_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3664
- "_mm_mask_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3665
- "_mm_maskz_dbsad_epu8"=>["AVX512VL", "AVX512BW"],
3666
- "_mm256_mask_div_pd"=>["AVX512VL", "AVX512F"],
3667
- "_mm256_maskz_div_pd"=>["AVX512VL", "AVX512F"],
3668
- "_mm_mask_div_pd"=>["AVX512VL", "AVX512F"],
3669
- "_mm_maskz_div_pd"=>["AVX512VL", "AVX512F"],
3670
- "_mm256_mask_div_ps"=>["AVX512VL", "AVX512F"],
3671
- "_mm256_maskz_div_ps"=>["AVX512VL", "AVX512F"],
3672
- "_mm_mask_div_ps"=>["AVX512VL", "AVX512F"],
3673
- "_mm_maskz_div_ps"=>["AVX512VL", "AVX512F"],
3674
- "_mm256_mask_expand_pd"=>["AVX512VL", "AVX512F"],
3675
- "_mm256_mask_expandloadu_pd"=>["AVX512VL", "AVX512F"],
3676
- "_mm256_maskz_expand_pd"=>["AVX512VL", "AVX512F"],
3677
- "_mm256_maskz_expandloadu_pd"=>["AVX512VL", "AVX512F"],
3678
- "_mm_mask_expand_pd"=>["AVX512VL", "AVX512F"],
3679
- "_mm_mask_expandloadu_pd"=>["AVX512VL", "AVX512F"],
3680
- "_mm_maskz_expand_pd"=>["AVX512VL", "AVX512F"],
3681
- "_mm_maskz_expandloadu_pd"=>["AVX512VL", "AVX512F"],
3682
- "_mm256_mask_expand_ps"=>["AVX512VL", "AVX512F"],
3683
- "_mm256_mask_expandloadu_ps"=>["AVX512VL", "AVX512F"],
3684
- "_mm256_maskz_expand_ps"=>["AVX512VL", "AVX512F"],
3685
- "_mm256_maskz_expandloadu_ps"=>["AVX512VL", "AVX512F"],
3686
- "_mm_mask_expand_ps"=>["AVX512VL", "AVX512F"],
3687
- "_mm_mask_expandloadu_ps"=>["AVX512VL", "AVX512F"],
3688
- "_mm_maskz_expand_ps"=>["AVX512VL", "AVX512F"],
3689
- "_mm_maskz_expandloadu_ps"=>["AVX512VL", "AVX512F"],
3690
- "_mm256_extractf32x4_ps"=>["AVX512VL", "AVX512F"],
3691
- "_mm256_mask_extractf32x4_ps"=>["AVX512VL", "AVX512F"],
3692
- "_mm256_maskz_extractf32x4_ps"=>["AVX512VL", "AVX512F"],
3663
+ "_mm_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3664
+ "_mm_mask_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3665
+ "_mm_maskz_dbsad_epu8"=>[["AVX512VL", "AVX512BW"]],
3666
+ "_mm256_mask_div_pd"=>[["AVX512VL", "AVX512F"]],
3667
+ "_mm256_maskz_div_pd"=>[["AVX512VL", "AVX512F"]],
3668
+ "_mm_mask_div_pd"=>[["AVX512VL", "AVX512F"]],
3669
+ "_mm_maskz_div_pd"=>[["AVX512VL", "AVX512F"]],
3670
+ "_mm256_mask_div_ps"=>[["AVX512VL", "AVX512F"]],
3671
+ "_mm256_maskz_div_ps"=>[["AVX512VL", "AVX512F"]],
3672
+ "_mm_mask_div_ps"=>[["AVX512VL", "AVX512F"]],
3673
+ "_mm_maskz_div_ps"=>[["AVX512VL", "AVX512F"]],
3674
+ "_mm256_mask_expand_pd"=>[["AVX512VL", "AVX512F"]],
3675
+ "_mm256_mask_expandloadu_pd"=>[["AVX512VL", "AVX512F"]],
3676
+ "_mm256_maskz_expand_pd"=>[["AVX512VL", "AVX512F"]],
3677
+ "_mm256_maskz_expandloadu_pd"=>[["AVX512VL", "AVX512F"]],
3678
+ "_mm_mask_expand_pd"=>[["AVX512VL", "AVX512F"]],
3679
+ "_mm_mask_expandloadu_pd"=>[["AVX512VL", "AVX512F"]],
3680
+ "_mm_maskz_expand_pd"=>[["AVX512VL", "AVX512F"]],
3681
+ "_mm_maskz_expandloadu_pd"=>[["AVX512VL", "AVX512F"]],
3682
+ "_mm256_mask_expand_ps"=>[["AVX512VL", "AVX512F"]],
3683
+ "_mm256_mask_expandloadu_ps"=>[["AVX512VL", "AVX512F"]],
3684
+ "_mm256_maskz_expand_ps"=>[["AVX512VL", "AVX512F"]],
3685
+ "_mm256_maskz_expandloadu_ps"=>[["AVX512VL", "AVX512F"]],
3686
+ "_mm_mask_expand_ps"=>[["AVX512VL", "AVX512F"]],
3687
+ "_mm_mask_expandloadu_ps"=>[["AVX512VL", "AVX512F"]],
3688
+ "_mm_maskz_expand_ps"=>[["AVX512VL", "AVX512F"]],
3689
+ "_mm_maskz_expandloadu_ps"=>[["AVX512VL", "AVX512F"]],
3690
+ "_mm256_extractf32x4_ps"=>[["AVX512VL", "AVX512F"]],
3691
+ "_mm256_mask_extractf32x4_ps"=>[["AVX512VL", "AVX512F"]],
3692
+ "_mm256_maskz_extractf32x4_ps"=>[["AVX512VL", "AVX512F"]],
3693
3693
  "_mm512_extractf32x8_ps"=>["AVX512DQ"],
3694
3694
  "_mm512_mask_extractf32x8_ps"=>["AVX512DQ"],
3695
3695
  "_mm512_maskz_extractf32x8_ps"=>["AVX512DQ"],
3696
- "_mm256_extractf64x2_pd"=>["AVX512VL", "AVX512DQ"],
3697
- "_mm256_mask_extractf64x2_pd"=>["AVX512VL", "AVX512DQ"],
3698
- "_mm256_maskz_extractf64x2_pd"=>["AVX512VL", "AVX512DQ"],
3696
+ "_mm256_extractf64x2_pd"=>[["AVX512VL", "AVX512DQ"]],
3697
+ "_mm256_mask_extractf64x2_pd"=>[["AVX512VL", "AVX512DQ"]],
3698
+ "_mm256_maskz_extractf64x2_pd"=>[["AVX512VL", "AVX512DQ"]],
3699
3699
  "_mm512_extractf64x2_pd"=>["AVX512DQ"],
3700
3700
  "_mm512_mask_extractf64x2_pd"=>["AVX512DQ"],
3701
3701
  "_mm512_maskz_extractf64x2_pd"=>["AVX512DQ"],
3702
- "_mm256_extracti32x4_epi32"=>["AVX512VL", "AVX512F"],
3703
- "_mm256_mask_extracti32x4_epi32"=>["AVX512VL", "AVX512F"],
3704
- "_mm256_maskz_extracti32x4_epi32"=>["AVX512VL", "AVX512F"],
3702
+ "_mm256_extracti32x4_epi32"=>[["AVX512VL", "AVX512F"]],
3703
+ "_mm256_mask_extracti32x4_epi32"=>[["AVX512VL", "AVX512F"]],
3704
+ "_mm256_maskz_extracti32x4_epi32"=>[["AVX512VL", "AVX512F"]],
3705
3705
  "_mm512_extracti32x8_epi32"=>["AVX512DQ"],
3706
3706
  "_mm512_mask_extracti32x8_epi32"=>["AVX512DQ"],
3707
3707
  "_mm512_maskz_extracti32x8_epi32"=>["AVX512DQ"],
3708
- "_mm256_extracti64x2_epi64"=>["AVX512VL", "AVX512DQ"],
3709
- "_mm256_mask_extracti64x2_epi64"=>["AVX512VL", "AVX512DQ"],
3710
- "_mm256_maskz_extracti64x2_epi64"=>["AVX512VL", "AVX512DQ"],
3708
+ "_mm256_extracti64x2_epi64"=>[["AVX512VL", "AVX512DQ"]],
3709
+ "_mm256_mask_extracti64x2_epi64"=>[["AVX512VL", "AVX512DQ"]],
3710
+ "_mm256_maskz_extracti64x2_epi64"=>[["AVX512VL", "AVX512DQ"]],
3711
3711
  "_mm512_extracti64x2_epi64"=>["AVX512DQ"],
3712
3712
  "_mm512_mask_extracti64x2_epi64"=>["AVX512DQ"],
3713
3713
  "_mm512_maskz_extracti64x2_epi64"=>["AVX512DQ"],
3714
- "_mm256_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3715
- "_mm256_mask_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3716
- "_mm256_maskz_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3717
- "_mm_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3718
- "_mm_mask_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3719
- "_mm_maskz_fixupimm_pd"=>["AVX512VL", "AVX512F"],
3720
- "_mm256_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3721
- "_mm256_mask_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3722
- "_mm256_maskz_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3723
- "_mm_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3724
- "_mm_mask_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3725
- "_mm_maskz_fixupimm_ps"=>["AVX512VL", "AVX512F"],
3726
- "_mm256_mask3_fmadd_pd"=>["AVX512VL", "AVX512F"],
3727
- "_mm256_mask_fmadd_pd"=>["AVX512VL", "AVX512F"],
3728
- "_mm256_maskz_fmadd_pd"=>["AVX512VL", "AVX512F"],
3729
- "_mm_mask3_fmadd_pd"=>["AVX512VL", "AVX512F"],
3730
- "_mm_mask_fmadd_pd"=>["AVX512VL", "AVX512F"],
3731
- "_mm_maskz_fmadd_pd"=>["AVX512VL", "AVX512F"],
3732
- "_mm256_mask3_fmadd_ps"=>["AVX512VL", "AVX512F"],
3733
- "_mm256_mask_fmadd_ps"=>["AVX512VL", "AVX512F"],
3734
- "_mm256_maskz_fmadd_ps"=>["AVX512VL", "AVX512F"],
3735
- "_mm_mask3_fmadd_ps"=>["AVX512VL", "AVX512F"],
3736
- "_mm_mask_fmadd_ps"=>["AVX512VL", "AVX512F"],
3737
- "_mm_maskz_fmadd_ps"=>["AVX512VL", "AVX512F"],
3738
- "_mm256_mask3_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3739
- "_mm256_mask_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3740
- "_mm256_maskz_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3741
- "_mm_mask3_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3742
- "_mm_mask_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3743
- "_mm_maskz_fmaddsub_pd"=>["AVX512VL", "AVX512F"],
3744
- "_mm256_mask3_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3745
- "_mm256_mask_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3746
- "_mm256_maskz_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3747
- "_mm_mask3_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3748
- "_mm_mask_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3749
- "_mm_maskz_fmaddsub_ps"=>["AVX512VL", "AVX512F"],
3750
- "_mm256_mask3_fmsub_pd"=>["AVX512VL", "AVX512F"],
3751
- "_mm256_mask_fmsub_pd"=>["AVX512VL", "AVX512F"],
3752
- "_mm256_maskz_fmsub_pd"=>["AVX512VL", "AVX512F"],
3753
- "_mm_mask3_fmsub_pd"=>["AVX512VL", "AVX512F"],
3754
- "_mm_mask_fmsub_pd"=>["AVX512VL", "AVX512F"],
3755
- "_mm_maskz_fmsub_pd"=>["AVX512VL", "AVX512F"],
3756
- "_mm256_mask3_fmsub_ps"=>["AVX512VL", "AVX512F"],
3757
- "_mm256_mask_fmsub_ps"=>["AVX512VL", "AVX512F"],
3758
- "_mm256_maskz_fmsub_ps"=>["AVX512VL", "AVX512F"],
3759
- "_mm_mask3_fmsub_ps"=>["AVX512VL", "AVX512F"],
3760
- "_mm_mask_fmsub_ps"=>["AVX512VL", "AVX512F"],
3761
- "_mm_maskz_fmsub_ps"=>["AVX512VL", "AVX512F"],
3762
- "_mm256_mask3_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3763
- "_mm256_mask_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3764
- "_mm256_maskz_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3765
- "_mm_mask3_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3766
- "_mm_mask_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3767
- "_mm_maskz_fmsubadd_pd"=>["AVX512VL", "AVX512F"],
3768
- "_mm256_mask3_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3769
- "_mm256_mask_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3770
- "_mm256_maskz_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3771
- "_mm_mask3_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3772
- "_mm_mask_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3773
- "_mm_maskz_fmsubadd_ps"=>["AVX512VL", "AVX512F"],
3774
- "_mm256_mask3_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3775
- "_mm256_mask_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3776
- "_mm256_maskz_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3777
- "_mm_mask3_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3778
- "_mm_mask_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3779
- "_mm_maskz_fnmadd_pd"=>["AVX512VL", "AVX512F"],
3780
- "_mm256_mask3_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3781
- "_mm256_mask_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3782
- "_mm256_maskz_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3783
- "_mm_mask3_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3784
- "_mm_mask_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3785
- "_mm_maskz_fnmadd_ps"=>["AVX512VL", "AVX512F"],
3786
- "_mm256_mask3_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3787
- "_mm256_mask_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3788
- "_mm256_maskz_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3789
- "_mm_mask3_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3790
- "_mm_mask_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3791
- "_mm_maskz_fnmsub_pd"=>["AVX512VL", "AVX512F"],
3792
- "_mm256_mask3_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3793
- "_mm256_mask_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3794
- "_mm256_maskz_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3795
- "_mm_mask3_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3796
- "_mm_mask_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3797
- "_mm_maskz_fnmsub_ps"=>["AVX512VL", "AVX512F"],
3798
- "_mm256_fpclass_pd_mask"=>["AVX512VL", "AVX512DQ"],
3799
- "_mm256_mask_fpclass_pd_mask"=>["AVX512VL", "AVX512DQ"],
3714
+ "_mm256_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3715
+ "_mm256_mask_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3716
+ "_mm256_maskz_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3717
+ "_mm_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3718
+ "_mm_mask_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3719
+ "_mm_maskz_fixupimm_pd"=>[["AVX512VL", "AVX512F"]],
3720
+ "_mm256_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3721
+ "_mm256_mask_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3722
+ "_mm256_maskz_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3723
+ "_mm_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3724
+ "_mm_mask_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3725
+ "_mm_maskz_fixupimm_ps"=>[["AVX512VL", "AVX512F"]],
3726
+ "_mm256_mask3_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3727
+ "_mm256_mask_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3728
+ "_mm256_maskz_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3729
+ "_mm_mask3_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3730
+ "_mm_mask_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3731
+ "_mm_maskz_fmadd_pd"=>[["AVX512VL", "AVX512F"]],
3732
+ "_mm256_mask3_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3733
+ "_mm256_mask_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3734
+ "_mm256_maskz_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3735
+ "_mm_mask3_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3736
+ "_mm_mask_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3737
+ "_mm_maskz_fmadd_ps"=>[["AVX512VL", "AVX512F"]],
3738
+ "_mm256_mask3_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3739
+ "_mm256_mask_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3740
+ "_mm256_maskz_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3741
+ "_mm_mask3_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3742
+ "_mm_mask_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3743
+ "_mm_maskz_fmaddsub_pd"=>[["AVX512VL", "AVX512F"]],
3744
+ "_mm256_mask3_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3745
+ "_mm256_mask_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3746
+ "_mm256_maskz_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3747
+ "_mm_mask3_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3748
+ "_mm_mask_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3749
+ "_mm_maskz_fmaddsub_ps"=>[["AVX512VL", "AVX512F"]],
3750
+ "_mm256_mask3_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3751
+ "_mm256_mask_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3752
+ "_mm256_maskz_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3753
+ "_mm_mask3_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3754
+ "_mm_mask_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3755
+ "_mm_maskz_fmsub_pd"=>[["AVX512VL", "AVX512F"]],
3756
+ "_mm256_mask3_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3757
+ "_mm256_mask_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3758
+ "_mm256_maskz_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3759
+ "_mm_mask3_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3760
+ "_mm_mask_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3761
+ "_mm_maskz_fmsub_ps"=>[["AVX512VL", "AVX512F"]],
3762
+ "_mm256_mask3_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3763
+ "_mm256_mask_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3764
+ "_mm256_maskz_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3765
+ "_mm_mask3_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3766
+ "_mm_mask_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3767
+ "_mm_maskz_fmsubadd_pd"=>[["AVX512VL", "AVX512F"]],
3768
+ "_mm256_mask3_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3769
+ "_mm256_mask_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3770
+ "_mm256_maskz_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3771
+ "_mm_mask3_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3772
+ "_mm_mask_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3773
+ "_mm_maskz_fmsubadd_ps"=>[["AVX512VL", "AVX512F"]],
3774
+ "_mm256_mask3_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3775
+ "_mm256_mask_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3776
+ "_mm256_maskz_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3777
+ "_mm_mask3_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3778
+ "_mm_mask_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3779
+ "_mm_maskz_fnmadd_pd"=>[["AVX512VL", "AVX512F"]],
3780
+ "_mm256_mask3_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3781
+ "_mm256_mask_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3782
+ "_mm256_maskz_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3783
+ "_mm_mask3_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3784
+ "_mm_mask_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3785
+ "_mm_maskz_fnmadd_ps"=>[["AVX512VL", "AVX512F"]],
3786
+ "_mm256_mask3_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3787
+ "_mm256_mask_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3788
+ "_mm256_maskz_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3789
+ "_mm_mask3_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3790
+ "_mm_mask_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3791
+ "_mm_maskz_fnmsub_pd"=>[["AVX512VL", "AVX512F"]],
3792
+ "_mm256_mask3_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3793
+ "_mm256_mask_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3794
+ "_mm256_maskz_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3795
+ "_mm_mask3_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3796
+ "_mm_mask_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3797
+ "_mm_maskz_fnmsub_ps"=>[["AVX512VL", "AVX512F"]],
3798
+ "_mm256_fpclass_pd_mask"=>[["AVX512VL", "AVX512DQ"]],
3799
+ "_mm256_mask_fpclass_pd_mask"=>[["AVX512VL", "AVX512DQ"]],
3800
3800
  "_mm512_fpclass_pd_mask"=>["AVX512DQ"],
3801
3801
  "_mm512_mask_fpclass_pd_mask"=>["AVX512DQ"],
3802
- "_mm_fpclass_pd_mask"=>["AVX512VL", "AVX512DQ"],
3803
- "_mm_mask_fpclass_pd_mask"=>["AVX512VL", "AVX512DQ"],
3804
- "_mm256_fpclass_ps_mask"=>["AVX512VL", "AVX512DQ"],
3805
- "_mm256_mask_fpclass_ps_mask"=>["AVX512VL", "AVX512DQ"],
3802
+ "_mm_fpclass_pd_mask"=>[["AVX512VL", "AVX512DQ"]],
3803
+ "_mm_mask_fpclass_pd_mask"=>[["AVX512VL", "AVX512DQ"]],
3804
+ "_mm256_fpclass_ps_mask"=>[["AVX512VL", "AVX512DQ"]],
3805
+ "_mm256_mask_fpclass_ps_mask"=>[["AVX512VL", "AVX512DQ"]],
3806
3806
  "_mm512_fpclass_ps_mask"=>["AVX512DQ"],
3807
3807
  "_mm512_mask_fpclass_ps_mask"=>["AVX512DQ"],
3808
- "_mm_fpclass_ps_mask"=>["AVX512VL", "AVX512DQ"],
3809
- "_mm_mask_fpclass_ps_mask"=>["AVX512VL", "AVX512DQ"],
3808
+ "_mm_fpclass_ps_mask"=>[["AVX512VL", "AVX512DQ"]],
3809
+ "_mm_mask_fpclass_ps_mask"=>[["AVX512VL", "AVX512DQ"]],
3810
3810
  "_mm_fpclass_sd_mask"=>["AVX512DQ"],
3811
3811
  "_mm_mask_fpclass_sd_mask"=>["AVX512DQ"],
3812
3812
  "_mm_fpclass_ss_mask"=>["AVX512DQ"],
3813
3813
  "_mm_mask_fpclass_ss_mask"=>["AVX512DQ"],
3814
- "_mm256_mmask_i32gather_pd"=>["AVX512VL", "AVX512F"],
3815
- "_mm_mmask_i32gather_pd"=>["AVX512VL", "AVX512F"],
3816
- "_mm256_mmask_i32gather_ps"=>["AVX512VL", "AVX512F"],
3817
- "_mm_mmask_i32gather_ps"=>["AVX512VL", "AVX512F"],
3818
- "_mm256_mmask_i64gather_pd"=>["AVX512VL", "AVX512F"],
3819
- "_mm_mmask_i64gather_pd"=>["AVX512VL", "AVX512F"],
3820
- "_mm256_mmask_i64gather_ps"=>["AVX512VL", "AVX512F"],
3821
- "_mm_mmask_i64gather_ps"=>["AVX512VL", "AVX512F"],
3822
- "_mm256_getexp_pd"=>["AVX512VL", "AVX512F"],
3823
- "_mm256_mask_getexp_pd"=>["AVX512VL", "AVX512F"],
3824
- "_mm256_maskz_getexp_pd"=>["AVX512VL", "AVX512F"],
3825
- "_mm_getexp_pd"=>["AVX512VL", "AVX512F"],
3826
- "_mm_mask_getexp_pd"=>["AVX512VL", "AVX512F"],
3827
- "_mm_maskz_getexp_pd"=>["AVX512VL", "AVX512F"],
3828
- "_mm256_getexp_ps"=>["AVX512VL", "AVX512F"],
3829
- "_mm256_mask_getexp_ps"=>["AVX512VL", "AVX512F"],
3830
- "_mm256_maskz_getexp_ps"=>["AVX512VL", "AVX512F"],
3831
- "_mm_getexp_ps"=>["AVX512VL", "AVX512F"],
3832
- "_mm_mask_getexp_ps"=>["AVX512VL", "AVX512F"],
3833
- "_mm_maskz_getexp_ps"=>["AVX512VL", "AVX512F"],
3834
- "_mm256_getmant_pd"=>["AVX512VL", "AVX512F"],
3835
- "_mm256_mask_getmant_pd"=>["AVX512VL", "AVX512F"],
3836
- "_mm256_maskz_getmant_pd"=>["AVX512VL", "AVX512F"],
3837
- "_mm_getmant_pd"=>["AVX512VL", "AVX512F"],
3838
- "_mm_mask_getmant_pd"=>["AVX512VL", "AVX512F"],
3839
- "_mm_maskz_getmant_pd"=>["AVX512VL", "AVX512F"],
3840
- "_mm256_getmant_ps"=>["AVX512VL", "AVX512F"],
3841
- "_mm256_mask_getmant_ps"=>["AVX512VL", "AVX512F"],
3842
- "_mm256_maskz_getmant_ps"=>["AVX512VL", "AVX512F"],
3843
- "_mm_getmant_ps"=>["AVX512VL", "AVX512F"],
3844
- "_mm_mask_getmant_ps"=>["AVX512VL", "AVX512F"],
3845
- "_mm_maskz_getmant_ps"=>["AVX512VL", "AVX512F"],
3846
- "_mm256_insertf32x4"=>["AVX512VL", "AVX512F"],
3847
- "_mm256_mask_insertf32x4"=>["AVX512VL", "AVX512F"],
3848
- "_mm256_maskz_insertf32x4"=>["AVX512VL", "AVX512F"],
3814
+ "_mm256_mmask_i32gather_pd"=>[["AVX512VL", "AVX512F"]],
3815
+ "_mm_mmask_i32gather_pd"=>[["AVX512VL", "AVX512F"]],
3816
+ "_mm256_mmask_i32gather_ps"=>[["AVX512VL", "AVX512F"]],
3817
+ "_mm_mmask_i32gather_ps"=>[["AVX512VL", "AVX512F"]],
3818
+ "_mm256_mmask_i64gather_pd"=>[["AVX512VL", "AVX512F"]],
3819
+ "_mm_mmask_i64gather_pd"=>[["AVX512VL", "AVX512F"]],
3820
+ "_mm256_mmask_i64gather_ps"=>[["AVX512VL", "AVX512F"]],
3821
+ "_mm_mmask_i64gather_ps"=>[["AVX512VL", "AVX512F"]],
3822
+ "_mm256_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3823
+ "_mm256_mask_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3824
+ "_mm256_maskz_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3825
+ "_mm_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3826
+ "_mm_mask_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3827
+ "_mm_maskz_getexp_pd"=>[["AVX512VL", "AVX512F"]],
3828
+ "_mm256_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3829
+ "_mm256_mask_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3830
+ "_mm256_maskz_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3831
+ "_mm_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3832
+ "_mm_mask_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3833
+ "_mm_maskz_getexp_ps"=>[["AVX512VL", "AVX512F"]],
3834
+ "_mm256_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3835
+ "_mm256_mask_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3836
+ "_mm256_maskz_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3837
+ "_mm_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3838
+ "_mm_mask_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3839
+ "_mm_maskz_getmant_pd"=>[["AVX512VL", "AVX512F"]],
3840
+ "_mm256_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3841
+ "_mm256_mask_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3842
+ "_mm256_maskz_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3843
+ "_mm_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3844
+ "_mm_mask_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3845
+ "_mm_maskz_getmant_ps"=>[["AVX512VL", "AVX512F"]],
3846
+ "_mm256_insertf32x4"=>[["AVX512VL", "AVX512F"]],
3847
+ "_mm256_mask_insertf32x4"=>[["AVX512VL", "AVX512F"]],
3848
+ "_mm256_maskz_insertf32x4"=>[["AVX512VL", "AVX512F"]],
3849
3849
  "_mm512_insertf32x8"=>["AVX512DQ"],
3850
3850
  "_mm512_mask_insertf32x8"=>["AVX512DQ"],
3851
3851
  "_mm512_maskz_insertf32x8"=>["AVX512DQ"],
3852
- "_mm256_insertf64x2"=>["AVX512VL", "AVX512DQ"],
3853
- "_mm256_mask_insertf64x2"=>["AVX512VL", "AVX512DQ"],
3854
- "_mm256_maskz_insertf64x2"=>["AVX512VL", "AVX512DQ"],
3852
+ "_mm256_insertf64x2"=>[["AVX512VL", "AVX512DQ"]],
3853
+ "_mm256_mask_insertf64x2"=>[["AVX512VL", "AVX512DQ"]],
3854
+ "_mm256_maskz_insertf64x2"=>[["AVX512VL", "AVX512DQ"]],
3855
3855
  "_mm512_insertf64x2"=>["AVX512DQ"],
3856
3856
  "_mm512_mask_insertf64x2"=>["AVX512DQ"],
3857
3857
  "_mm512_maskz_insertf64x2"=>["AVX512DQ"],
3858
- "_mm256_inserti32x4"=>["AVX512VL", "AVX512F"],
3859
- "_mm256_mask_inserti32x4"=>["AVX512VL", "AVX512F"],
3860
- "_mm256_maskz_inserti32x4"=>["AVX512VL", "AVX512F"],
3858
+ "_mm256_inserti32x4"=>[["AVX512VL", "AVX512F"]],
3859
+ "_mm256_mask_inserti32x4"=>[["AVX512VL", "AVX512F"]],
3860
+ "_mm256_maskz_inserti32x4"=>[["AVX512VL", "AVX512F"]],
3861
3861
  "_mm512_inserti32x8"=>["AVX512DQ"],
3862
3862
  "_mm512_mask_inserti32x8"=>["AVX512DQ"],
3863
3863
  "_mm512_maskz_inserti32x8"=>["AVX512DQ"],
3864
- "_mm256_inserti64x2"=>["AVX512VL", "AVX512DQ"],
3865
- "_mm256_mask_inserti64x2"=>["AVX512VL", "AVX512DQ"],
3866
- "_mm256_maskz_inserti64x2"=>["AVX512VL", "AVX512DQ"],
3864
+ "_mm256_inserti64x2"=>[["AVX512VL", "AVX512DQ"]],
3865
+ "_mm256_mask_inserti64x2"=>[["AVX512VL", "AVX512DQ"]],
3866
+ "_mm256_maskz_inserti64x2"=>[["AVX512VL", "AVX512DQ"]],
3867
3867
  "_mm512_inserti64x2"=>["AVX512DQ"],
3868
3868
  "_mm512_mask_inserti64x2"=>["AVX512DQ"],
3869
3869
  "_mm512_maskz_inserti64x2"=>["AVX512DQ"],
3870
- "_mm256_mask_max_pd"=>["AVX512VL", "AVX512F"],
3871
- "_mm256_maskz_max_pd"=>["AVX512VL", "AVX512F"],
3872
- "_mm_mask_max_pd"=>["AVX512VL", "AVX512F"],
3873
- "_mm_maskz_max_pd"=>["AVX512VL", "AVX512F"],
3874
- "_mm256_mask_max_ps"=>["AVX512VL", "AVX512F"],
3875
- "_mm256_maskz_max_ps"=>["AVX512VL", "AVX512F"],
3876
- "_mm_mask_max_ps"=>["AVX512VL", "AVX512F"],
3877
- "_mm_maskz_max_ps"=>["AVX512VL", "AVX512F"],
3878
- "_mm256_mask_min_pd"=>["AVX512VL", "AVX512F"],
3879
- "_mm256_maskz_min_pd"=>["AVX512VL", "AVX512F"],
3880
- "_mm_mask_min_pd"=>["AVX512VL", "AVX512F"],
3881
- "_mm_maskz_min_pd"=>["AVX512VL", "AVX512F"],
3882
- "_mm256_mask_min_ps"=>["AVX512VL", "AVX512F"],
3883
- "_mm256_maskz_min_ps"=>["AVX512VL", "AVX512F"],
3884
- "_mm_mask_min_ps"=>["AVX512VL", "AVX512F"],
3885
- "_mm_maskz_min_ps"=>["AVX512VL", "AVX512F"],
3886
- "_mm256_mask_load_pd"=>["AVX512VL", "AVX512F"],
3887
- "_mm256_mask_mov_pd"=>["AVX512VL", "AVX512F"],
3888
- "_mm256_mask_store_pd"=>["AVX512VL", "AVX512F"],
3889
- "_mm256_maskz_load_pd"=>["AVX512VL", "AVX512F"],
3890
- "_mm256_maskz_mov_pd"=>["AVX512VL", "AVX512F"],
3891
- "_mm_mask_load_pd"=>["AVX512VL", "AVX512F"],
3892
- "_mm_mask_mov_pd"=>["AVX512VL", "AVX512F"],
3893
- "_mm_mask_store_pd"=>["AVX512VL", "AVX512F"],
3894
- "_mm_maskz_load_pd"=>["AVX512VL", "AVX512F"],
3895
- "_mm_maskz_mov_pd"=>["AVX512VL", "AVX512F"],
3896
- "_mm256_mask_load_ps"=>["AVX512VL", "AVX512F"],
3897
- "_mm256_mask_mov_ps"=>["AVX512VL", "AVX512F"],
3898
- "_mm256_mask_store_ps"=>["AVX512VL", "AVX512F"],
3899
- "_mm256_maskz_load_ps"=>["AVX512VL", "AVX512F"],
3900
- "_mm256_maskz_mov_ps"=>["AVX512VL", "AVX512F"],
3901
- "_mm_mask_load_ps"=>["AVX512VL", "AVX512F"],
3902
- "_mm_mask_mov_ps"=>["AVX512VL", "AVX512F"],
3903
- "_mm_mask_store_ps"=>["AVX512VL", "AVX512F"],
3904
- "_mm_maskz_load_ps"=>["AVX512VL", "AVX512F"],
3905
- "_mm_maskz_mov_ps"=>["AVX512VL", "AVX512F"],
3906
- "_mm256_mask_movedup_pd"=>["AVX512VL", "AVX512F"],
3907
- "_mm256_maskz_movedup_pd"=>["AVX512VL", "AVX512F"],
3908
- "_mm_mask_movedup_pd"=>["AVX512VL", "AVX512F"],
3909
- "_mm_maskz_movedup_pd"=>["AVX512VL", "AVX512F"],
3910
- "_mm256_mask_load_epi32"=>["AVX512VL", "AVX512F"],
3911
- "_mm256_mask_mov_epi32"=>["AVX512VL", "AVX512F"],
3912
- "_mm256_mask_store_epi32"=>["AVX512VL", "AVX512F"],
3913
- "_mm256_maskz_load_epi32"=>["AVX512VL", "AVX512F"],
3914
- "_mm256_maskz_mov_epi32"=>["AVX512VL", "AVX512F"],
3915
- "_mm_mask_load_epi32"=>["AVX512VL", "AVX512F"],
3916
- "_mm_mask_mov_epi32"=>["AVX512VL", "AVX512F"],
3917
- "_mm_mask_store_epi32"=>["AVX512VL", "AVX512F"],
3918
- "_mm_maskz_load_epi32"=>["AVX512VL", "AVX512F"],
3919
- "_mm_maskz_mov_epi32"=>["AVX512VL", "AVX512F"],
3920
- "_mm256_mask_load_epi64"=>["AVX512VL", "AVX512F"],
3921
- "_mm256_mask_mov_epi64"=>["AVX512VL", "AVX512F"],
3922
- "_mm256_mask_store_epi64"=>["AVX512VL", "AVX512F"],
3923
- "_mm256_maskz_load_epi64"=>["AVX512VL", "AVX512F"],
3924
- "_mm256_maskz_mov_epi64"=>["AVX512VL", "AVX512F"],
3925
- "_mm_mask_load_epi64"=>["AVX512VL", "AVX512F"],
3926
- "_mm_mask_mov_epi64"=>["AVX512VL", "AVX512F"],
3927
- "_mm_mask_store_epi64"=>["AVX512VL", "AVX512F"],
3928
- "_mm_maskz_load_epi64"=>["AVX512VL", "AVX512F"],
3929
- "_mm_maskz_mov_epi64"=>["AVX512VL", "AVX512F"],
3930
- "_mm256_mask_loadu_epi16"=>["AVX512VL", "AVX512BW"],
3931
- "_mm256_mask_mov_epi16"=>["AVX512VL", "AVX512BW"],
3932
- "_mm256_mask_storeu_epi16"=>["AVX512VL", "AVX512BW"],
3933
- "_mm256_maskz_loadu_epi16"=>["AVX512VL", "AVX512BW"],
3934
- "_mm256_maskz_mov_epi16"=>["AVX512VL", "AVX512BW"],
3870
+ "_mm256_mask_max_pd"=>[["AVX512VL", "AVX512F"]],
3871
+ "_mm256_maskz_max_pd"=>[["AVX512VL", "AVX512F"]],
3872
+ "_mm_mask_max_pd"=>[["AVX512VL", "AVX512F"]],
3873
+ "_mm_maskz_max_pd"=>[["AVX512VL", "AVX512F"]],
3874
+ "_mm256_mask_max_ps"=>[["AVX512VL", "AVX512F"]],
3875
+ "_mm256_maskz_max_ps"=>[["AVX512VL", "AVX512F"]],
3876
+ "_mm_mask_max_ps"=>[["AVX512VL", "AVX512F"]],
3877
+ "_mm_maskz_max_ps"=>[["AVX512VL", "AVX512F"]],
3878
+ "_mm256_mask_min_pd"=>[["AVX512VL", "AVX512F"]],
3879
+ "_mm256_maskz_min_pd"=>[["AVX512VL", "AVX512F"]],
3880
+ "_mm_mask_min_pd"=>[["AVX512VL", "AVX512F"]],
3881
+ "_mm_maskz_min_pd"=>[["AVX512VL", "AVX512F"]],
3882
+ "_mm256_mask_min_ps"=>[["AVX512VL", "AVX512F"]],
3883
+ "_mm256_maskz_min_ps"=>[["AVX512VL", "AVX512F"]],
3884
+ "_mm_mask_min_ps"=>[["AVX512VL", "AVX512F"]],
3885
+ "_mm_maskz_min_ps"=>[["AVX512VL", "AVX512F"]],
3886
+ "_mm256_mask_load_pd"=>[["AVX512VL", "AVX512F"]],
3887
+ "_mm256_mask_mov_pd"=>[["AVX512VL", "AVX512F"]],
3888
+ "_mm256_mask_store_pd"=>[["AVX512VL", "AVX512F"]],
3889
+ "_mm256_maskz_load_pd"=>[["AVX512VL", "AVX512F"]],
3890
+ "_mm256_maskz_mov_pd"=>[["AVX512VL", "AVX512F"]],
3891
+ "_mm_mask_load_pd"=>[["AVX512VL", "AVX512F"]],
3892
+ "_mm_mask_mov_pd"=>[["AVX512VL", "AVX512F"]],
3893
+ "_mm_mask_store_pd"=>[["AVX512VL", "AVX512F"]],
3894
+ "_mm_maskz_load_pd"=>[["AVX512VL", "AVX512F"]],
3895
+ "_mm_maskz_mov_pd"=>[["AVX512VL", "AVX512F"]],
3896
+ "_mm256_mask_load_ps"=>[["AVX512VL", "AVX512F"]],
3897
+ "_mm256_mask_mov_ps"=>[["AVX512VL", "AVX512F"]],
3898
+ "_mm256_mask_store_ps"=>[["AVX512VL", "AVX512F"]],
3899
+ "_mm256_maskz_load_ps"=>[["AVX512VL", "AVX512F"]],
3900
+ "_mm256_maskz_mov_ps"=>[["AVX512VL", "AVX512F"]],
3901
+ "_mm_mask_load_ps"=>[["AVX512VL", "AVX512F"]],
3902
+ "_mm_mask_mov_ps"=>[["AVX512VL", "AVX512F"]],
3903
+ "_mm_mask_store_ps"=>[["AVX512VL", "AVX512F"]],
3904
+ "_mm_maskz_load_ps"=>[["AVX512VL", "AVX512F"]],
3905
+ "_mm_maskz_mov_ps"=>[["AVX512VL", "AVX512F"]],
3906
+ "_mm256_mask_movedup_pd"=>[["AVX512VL", "AVX512F"]],
3907
+ "_mm256_maskz_movedup_pd"=>[["AVX512VL", "AVX512F"]],
3908
+ "_mm_mask_movedup_pd"=>[["AVX512VL", "AVX512F"]],
3909
+ "_mm_maskz_movedup_pd"=>[["AVX512VL", "AVX512F"]],
3910
+ "_mm256_mask_load_epi32"=>[["AVX512VL", "AVX512F"]],
3911
+ "_mm256_mask_mov_epi32"=>[["AVX512VL", "AVX512F"]],
3912
+ "_mm256_mask_store_epi32"=>[["AVX512VL", "AVX512F"]],
3913
+ "_mm256_maskz_load_epi32"=>[["AVX512VL", "AVX512F"]],
3914
+ "_mm256_maskz_mov_epi32"=>[["AVX512VL", "AVX512F"]],
3915
+ "_mm_mask_load_epi32"=>[["AVX512VL", "AVX512F"]],
3916
+ "_mm_mask_mov_epi32"=>[["AVX512VL", "AVX512F"]],
3917
+ "_mm_mask_store_epi32"=>[["AVX512VL", "AVX512F"]],
3918
+ "_mm_maskz_load_epi32"=>[["AVX512VL", "AVX512F"]],
3919
+ "_mm_maskz_mov_epi32"=>[["AVX512VL", "AVX512F"]],
3920
+ "_mm256_mask_load_epi64"=>[["AVX512VL", "AVX512F"]],
3921
+ "_mm256_mask_mov_epi64"=>[["AVX512VL", "AVX512F"]],
3922
+ "_mm256_mask_store_epi64"=>[["AVX512VL", "AVX512F"]],
3923
+ "_mm256_maskz_load_epi64"=>[["AVX512VL", "AVX512F"]],
3924
+ "_mm256_maskz_mov_epi64"=>[["AVX512VL", "AVX512F"]],
3925
+ "_mm_mask_load_epi64"=>[["AVX512VL", "AVX512F"]],
3926
+ "_mm_mask_mov_epi64"=>[["AVX512VL", "AVX512F"]],
3927
+ "_mm_mask_store_epi64"=>[["AVX512VL", "AVX512F"]],
3928
+ "_mm_maskz_load_epi64"=>[["AVX512VL", "AVX512F"]],
3929
+ "_mm_maskz_mov_epi64"=>[["AVX512VL", "AVX512F"]],
3930
+ "_mm256_mask_loadu_epi16"=>[["AVX512VL", "AVX512BW"]],
3931
+ "_mm256_mask_mov_epi16"=>[["AVX512VL", "AVX512BW"]],
3932
+ "_mm256_mask_storeu_epi16"=>[["AVX512VL", "AVX512BW"]],
3933
+ "_mm256_maskz_loadu_epi16"=>[["AVX512VL", "AVX512BW"]],
3934
+ "_mm256_maskz_mov_epi16"=>[["AVX512VL", "AVX512BW"]],
3935
3935
  "_mm512_mask_loadu_epi16"=>["AVX512BW"],
3936
3936
  "_mm512_mask_mov_epi16"=>["AVX512BW"],
3937
3937
  "_mm512_mask_storeu_epi16"=>["AVX512BW"],
3938
3938
  "_mm512_maskz_loadu_epi16"=>["AVX512BW"],
3939
3939
  "_mm512_maskz_mov_epi16"=>["AVX512BW"],
3940
- "_mm_mask_loadu_epi16"=>["AVX512VL", "AVX512BW"],
3941
- "_mm_mask_mov_epi16"=>["AVX512VL", "AVX512BW"],
3942
- "_mm_mask_storeu_epi16"=>["AVX512VL", "AVX512BW"],
3943
- "_mm_maskz_loadu_epi16"=>["AVX512VL", "AVX512BW"],
3944
- "_mm_maskz_mov_epi16"=>["AVX512VL", "AVX512BW"],
3945
- "_mm256_mask_loadu_epi32"=>["AVX512VL", "AVX512F"],
3946
- "_mm256_mask_storeu_epi32"=>["AVX512VL", "AVX512F"],
3947
- "_mm256_maskz_loadu_epi32"=>["AVX512VL", "AVX512F"],
3948
- "_mm_mask_loadu_epi32"=>["AVX512VL", "AVX512F"],
3949
- "_mm_mask_storeu_epi32"=>["AVX512VL", "AVX512F"],
3950
- "_mm_maskz_loadu_epi32"=>["AVX512VL", "AVX512F"],
3951
- "_mm256_mask_loadu_epi64"=>["AVX512VL", "AVX512F"],
3952
- "_mm256_mask_storeu_epi64"=>["AVX512VL", "AVX512F"],
3953
- "_mm256_maskz_loadu_epi64"=>["AVX512VL", "AVX512F"],
3954
- "_mm_mask_loadu_epi64"=>["AVX512VL", "AVX512F"],
3955
- "_mm_mask_storeu_epi64"=>["AVX512VL", "AVX512F"],
3956
- "_mm_maskz_loadu_epi64"=>["AVX512VL", "AVX512F"],
3957
- "_mm256_mask_loadu_epi8"=>["AVX512VL", "AVX512BW"],
3958
- "_mm256_mask_mov_epi8"=>["AVX512VL", "AVX512BW"],
3959
- "_mm256_mask_storeu_epi8"=>["AVX512VL", "AVX512BW"],
3960
- "_mm256_maskz_loadu_epi8"=>["AVX512VL", "AVX512BW"],
3961
- "_mm256_maskz_mov_epi8"=>["AVX512VL", "AVX512BW"],
3940
+ "_mm_mask_loadu_epi16"=>[["AVX512VL", "AVX512BW"]],
3941
+ "_mm_mask_mov_epi16"=>[["AVX512VL", "AVX512BW"]],
3942
+ "_mm_mask_storeu_epi16"=>[["AVX512VL", "AVX512BW"]],
3943
+ "_mm_maskz_loadu_epi16"=>[["AVX512VL", "AVX512BW"]],
3944
+ "_mm_maskz_mov_epi16"=>[["AVX512VL", "AVX512BW"]],
3945
+ "_mm256_mask_loadu_epi32"=>[["AVX512VL", "AVX512F"]],
3946
+ "_mm256_mask_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
3947
+ "_mm256_maskz_loadu_epi32"=>[["AVX512VL", "AVX512F"]],
3948
+ "_mm_mask_loadu_epi32"=>[["AVX512VL", "AVX512F"]],
3949
+ "_mm_mask_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
3950
+ "_mm_maskz_loadu_epi32"=>[["AVX512VL", "AVX512F"]],
3951
+ "_mm256_mask_loadu_epi64"=>[["AVX512VL", "AVX512F"]],
3952
+ "_mm256_mask_storeu_epi64"=>[["AVX512VL", "AVX512F"]],
3953
+ "_mm256_maskz_loadu_epi64"=>[["AVX512VL", "AVX512F"]],
3954
+ "_mm_mask_loadu_epi64"=>[["AVX512VL", "AVX512F"]],
3955
+ "_mm_mask_storeu_epi64"=>[["AVX512VL", "AVX512F"]],
3956
+ "_mm_maskz_loadu_epi64"=>[["AVX512VL", "AVX512F"]],
3957
+ "_mm256_mask_loadu_epi8"=>[["AVX512VL", "AVX512BW"]],
3958
+ "_mm256_mask_mov_epi8"=>[["AVX512VL", "AVX512BW"]],
3959
+ "_mm256_mask_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
3960
+ "_mm256_maskz_loadu_epi8"=>[["AVX512VL", "AVX512BW"]],
3961
+ "_mm256_maskz_mov_epi8"=>[["AVX512VL", "AVX512BW"]],
3962
3962
  "_mm512_mask_loadu_epi8"=>["AVX512BW"],
3963
3963
  "_mm512_mask_mov_epi8"=>["AVX512BW"],
3964
3964
  "_mm512_mask_storeu_epi8"=>["AVX512BW"],
3965
3965
  "_mm512_maskz_loadu_epi8"=>["AVX512BW"],
3966
3966
  "_mm512_maskz_mov_epi8"=>["AVX512BW"],
3967
- "_mm_mask_loadu_epi8"=>["AVX512VL", "AVX512BW"],
3968
- "_mm_mask_mov_epi8"=>["AVX512VL", "AVX512BW"],
3969
- "_mm_mask_storeu_epi8"=>["AVX512VL", "AVX512BW"],
3970
- "_mm_maskz_loadu_epi8"=>["AVX512VL", "AVX512BW"],
3971
- "_mm_maskz_mov_epi8"=>["AVX512VL", "AVX512BW"],
3972
- "_mm256_mask_movehdup_ps"=>["AVX512VL", "AVX512F"],
3973
- "_mm256_maskz_movehdup_ps"=>["AVX512VL", "AVX512F"],
3974
- "_mm_mask_movehdup_ps"=>["AVX512VL", "AVX512F"],
3975
- "_mm_maskz_movehdup_ps"=>["AVX512VL", "AVX512F"],
3976
- "_mm256_mask_moveldup_ps"=>["AVX512VL", "AVX512F"],
3977
- "_mm256_maskz_moveldup_ps"=>["AVX512VL", "AVX512F"],
3978
- "_mm_mask_moveldup_ps"=>["AVX512VL", "AVX512F"],
3979
- "_mm_maskz_moveldup_ps"=>["AVX512VL", "AVX512F"],
3980
- "_mm256_mask_loadu_pd"=>["AVX512VL", "AVX512F"],
3981
- "_mm256_mask_storeu_pd"=>["AVX512VL", "AVX512F"],
3982
- "_mm256_maskz_loadu_pd"=>["AVX512VL", "AVX512F"],
3983
- "_mm_mask_loadu_pd"=>["AVX512VL", "AVX512F"],
3984
- "_mm_mask_storeu_pd"=>["AVX512VL", "AVX512F"],
3985
- "_mm_maskz_loadu_pd"=>["AVX512VL", "AVX512F"],
3986
- "_mm256_mask_loadu_ps"=>["AVX512VL", "AVX512F"],
3987
- "_mm256_mask_storeu_ps"=>["AVX512VL", "AVX512F"],
3988
- "_mm256_maskz_loadu_ps"=>["AVX512VL", "AVX512F"],
3989
- "_mm_mask_loadu_ps"=>["AVX512VL", "AVX512F"],
3990
- "_mm_mask_storeu_ps"=>["AVX512VL", "AVX512F"],
3991
- "_mm_maskz_loadu_ps"=>["AVX512VL", "AVX512F"],
3992
- "_mm256_mask_mul_pd"=>["AVX512VL", "AVX512F"],
3993
- "_mm256_maskz_mul_pd"=>["AVX512VL", "AVX512F"],
3994
- "_mm_mask_mul_pd"=>["AVX512VL", "AVX512F"],
3995
- "_mm_maskz_mul_pd"=>["AVX512VL", "AVX512F"],
3996
- "_mm256_mask_mul_ps"=>["AVX512VL", "AVX512F"],
3997
- "_mm256_maskz_mul_ps"=>["AVX512VL", "AVX512F"],
3998
- "_mm_mask_mul_ps"=>["AVX512VL", "AVX512F"],
3999
- "_mm_maskz_mul_ps"=>["AVX512VL", "AVX512F"],
4000
- "_mm256_mask_or_pd"=>["AVX512VL", "AVX512DQ"],
4001
- "_mm256_maskz_or_pd"=>["AVX512VL", "AVX512DQ"],
3967
+ "_mm_mask_loadu_epi8"=>[["AVX512VL", "AVX512BW"]],
3968
+ "_mm_mask_mov_epi8"=>[["AVX512VL", "AVX512BW"]],
3969
+ "_mm_mask_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
3970
+ "_mm_maskz_loadu_epi8"=>[["AVX512VL", "AVX512BW"]],
3971
+ "_mm_maskz_mov_epi8"=>[["AVX512VL", "AVX512BW"]],
3972
+ "_mm256_mask_movehdup_ps"=>[["AVX512VL", "AVX512F"]],
3973
+ "_mm256_maskz_movehdup_ps"=>[["AVX512VL", "AVX512F"]],
3974
+ "_mm_mask_movehdup_ps"=>[["AVX512VL", "AVX512F"]],
3975
+ "_mm_maskz_movehdup_ps"=>[["AVX512VL", "AVX512F"]],
3976
+ "_mm256_mask_moveldup_ps"=>[["AVX512VL", "AVX512F"]],
3977
+ "_mm256_maskz_moveldup_ps"=>[["AVX512VL", "AVX512F"]],
3978
+ "_mm_mask_moveldup_ps"=>[["AVX512VL", "AVX512F"]],
3979
+ "_mm_maskz_moveldup_ps"=>[["AVX512VL", "AVX512F"]],
3980
+ "_mm256_mask_loadu_pd"=>[["AVX512VL", "AVX512F"]],
3981
+ "_mm256_mask_storeu_pd"=>[["AVX512VL", "AVX512F"]],
3982
+ "_mm256_maskz_loadu_pd"=>[["AVX512VL", "AVX512F"]],
3983
+ "_mm_mask_loadu_pd"=>[["AVX512VL", "AVX512F"]],
3984
+ "_mm_mask_storeu_pd"=>[["AVX512VL", "AVX512F"]],
3985
+ "_mm_maskz_loadu_pd"=>[["AVX512VL", "AVX512F"]],
3986
+ "_mm256_mask_loadu_ps"=>[["AVX512VL", "AVX512F"]],
3987
+ "_mm256_mask_storeu_ps"=>[["AVX512VL", "AVX512F"]],
3988
+ "_mm256_maskz_loadu_ps"=>[["AVX512VL", "AVX512F"]],
3989
+ "_mm_mask_loadu_ps"=>[["AVX512VL", "AVX512F"]],
3990
+ "_mm_mask_storeu_ps"=>[["AVX512VL", "AVX512F"]],
3991
+ "_mm_maskz_loadu_ps"=>[["AVX512VL", "AVX512F"]],
3992
+ "_mm256_mask_mul_pd"=>[["AVX512VL", "AVX512F"]],
3993
+ "_mm256_maskz_mul_pd"=>[["AVX512VL", "AVX512F"]],
3994
+ "_mm_mask_mul_pd"=>[["AVX512VL", "AVX512F"]],
3995
+ "_mm_maskz_mul_pd"=>[["AVX512VL", "AVX512F"]],
3996
+ "_mm256_mask_mul_ps"=>[["AVX512VL", "AVX512F"]],
3997
+ "_mm256_maskz_mul_ps"=>[["AVX512VL", "AVX512F"]],
3998
+ "_mm_mask_mul_ps"=>[["AVX512VL", "AVX512F"]],
3999
+ "_mm_maskz_mul_ps"=>[["AVX512VL", "AVX512F"]],
4000
+ "_mm256_mask_or_pd"=>[["AVX512VL", "AVX512DQ"]],
4001
+ "_mm256_maskz_or_pd"=>[["AVX512VL", "AVX512DQ"]],
4002
4002
  "_mm512_mask_or_pd"=>["AVX512DQ"],
4003
4003
  "_mm512_maskz_or_pd"=>["AVX512DQ"],
4004
4004
  "_mm512_or_pd"=>["AVX512DQ"],
4005
- "_mm_mask_or_pd"=>["AVX512VL", "AVX512DQ"],
4006
- "_mm_maskz_or_pd"=>["AVX512VL", "AVX512DQ"],
4007
- "_mm256_mask_or_ps"=>["AVX512VL", "AVX512DQ"],
4008
- "_mm256_maskz_or_ps"=>["AVX512VL", "AVX512DQ"],
4005
+ "_mm_mask_or_pd"=>[["AVX512VL", "AVX512DQ"]],
4006
+ "_mm_maskz_or_pd"=>[["AVX512VL", "AVX512DQ"]],
4007
+ "_mm256_mask_or_ps"=>[["AVX512VL", "AVX512DQ"]],
4008
+ "_mm256_maskz_or_ps"=>[["AVX512VL", "AVX512DQ"]],
4009
4009
  "_mm512_mask_or_ps"=>["AVX512DQ"],
4010
4010
  "_mm512_maskz_or_ps"=>["AVX512DQ"],
4011
4011
  "_mm512_or_ps"=>["AVX512DQ"],
4012
- "_mm_mask_or_ps"=>["AVX512VL", "AVX512DQ"],
4013
- "_mm_maskz_or_ps"=>["AVX512VL", "AVX512DQ"],
4014
- "_mm256_mask_abs_epi8"=>["AVX512VL", "AVX512BW"],
4015
- "_mm256_maskz_abs_epi8"=>["AVX512VL", "AVX512BW"],
4012
+ "_mm_mask_or_ps"=>[["AVX512VL", "AVX512DQ"]],
4013
+ "_mm_maskz_or_ps"=>[["AVX512VL", "AVX512DQ"]],
4014
+ "_mm256_mask_abs_epi8"=>[["AVX512VL", "AVX512BW"]],
4015
+ "_mm256_maskz_abs_epi8"=>[["AVX512VL", "AVX512BW"]],
4016
4016
  "_mm512_abs_epi8"=>["AVX512BW"],
4017
4017
  "_mm512_mask_abs_epi8"=>["AVX512BW"],
4018
4018
  "_mm512_maskz_abs_epi8"=>["AVX512BW"],
4019
- "_mm_mask_abs_epi8"=>["AVX512VL", "AVX512BW"],
4020
- "_mm_maskz_abs_epi8"=>["AVX512VL", "AVX512BW"],
4021
- "_mm256_mask_abs_epi32"=>["AVX512VL", "AVX512F"],
4022
- "_mm256_maskz_abs_epi32"=>["AVX512VL", "AVX512F"],
4023
- "_mm_mask_abs_epi32"=>["AVX512VL", "AVX512F"],
4024
- "_mm_maskz_abs_epi32"=>["AVX512VL", "AVX512F"],
4025
- "_mm256_abs_epi64"=>["AVX512VL", "AVX512F"],
4026
- "_mm256_mask_abs_epi64"=>["AVX512VL", "AVX512F"],
4027
- "_mm256_maskz_abs_epi64"=>["AVX512VL", "AVX512F"],
4028
- "_mm_abs_epi64"=>["AVX512VL", "AVX512F"],
4029
- "_mm_mask_abs_epi64"=>["AVX512VL", "AVX512F"],
4030
- "_mm_maskz_abs_epi64"=>["AVX512VL", "AVX512F"],
4031
- "_mm256_mask_abs_epi16"=>["AVX512VL", "AVX512BW"],
4032
- "_mm256_maskz_abs_epi16"=>["AVX512VL", "AVX512BW"],
4019
+ "_mm_mask_abs_epi8"=>[["AVX512VL", "AVX512BW"]],
4020
+ "_mm_maskz_abs_epi8"=>[["AVX512VL", "AVX512BW"]],
4021
+ "_mm256_mask_abs_epi32"=>[["AVX512VL", "AVX512F"]],
4022
+ "_mm256_maskz_abs_epi32"=>[["AVX512VL", "AVX512F"]],
4023
+ "_mm_mask_abs_epi32"=>[["AVX512VL", "AVX512F"]],
4024
+ "_mm_maskz_abs_epi32"=>[["AVX512VL", "AVX512F"]],
4025
+ "_mm256_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4026
+ "_mm256_mask_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4027
+ "_mm256_maskz_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4028
+ "_mm_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4029
+ "_mm_mask_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4030
+ "_mm_maskz_abs_epi64"=>[["AVX512VL", "AVX512F"]],
4031
+ "_mm256_mask_abs_epi16"=>[["AVX512VL", "AVX512BW"]],
4032
+ "_mm256_maskz_abs_epi16"=>[["AVX512VL", "AVX512BW"]],
4033
4033
  "_mm512_abs_epi16"=>["AVX512BW"],
4034
4034
  "_mm512_mask_abs_epi16"=>["AVX512BW"],
4035
4035
  "_mm512_maskz_abs_epi16"=>["AVX512BW"],
4036
- "_mm_mask_abs_epi16"=>["AVX512VL", "AVX512BW"],
4037
- "_mm_maskz_abs_epi16"=>["AVX512VL", "AVX512BW"],
4038
- "_mm256_mask_packs_epi32"=>["AVX512VL", "AVX512BW"],
4039
- "_mm256_maskz_packs_epi32"=>["AVX512VL", "AVX512BW"],
4036
+ "_mm_mask_abs_epi16"=>[["AVX512VL", "AVX512BW"]],
4037
+ "_mm_maskz_abs_epi16"=>[["AVX512VL", "AVX512BW"]],
4038
+ "_mm256_mask_packs_epi32"=>[["AVX512VL", "AVX512BW"]],
4039
+ "_mm256_maskz_packs_epi32"=>[["AVX512VL", "AVX512BW"]],
4040
4040
  "_mm512_mask_packs_epi32"=>["AVX512BW"],
4041
4041
  "_mm512_maskz_packs_epi32"=>["AVX512BW"],
4042
4042
  "_mm512_packs_epi32"=>["AVX512BW"],
4043
- "_mm_mask_packs_epi32"=>["AVX512VL", "AVX512BW"],
4044
- "_mm_maskz_packs_epi32"=>["AVX512VL", "AVX512BW"],
4045
- "_mm256_mask_packs_epi16"=>["AVX512VL", "AVX512BW"],
4046
- "_mm256_maskz_packs_epi16"=>["AVX512VL", "AVX512BW"],
4043
+ "_mm_mask_packs_epi32"=>[["AVX512VL", "AVX512BW"]],
4044
+ "_mm_maskz_packs_epi32"=>[["AVX512VL", "AVX512BW"]],
4045
+ "_mm256_mask_packs_epi16"=>[["AVX512VL", "AVX512BW"]],
4046
+ "_mm256_maskz_packs_epi16"=>[["AVX512VL", "AVX512BW"]],
4047
4047
  "_mm512_mask_packs_epi16"=>["AVX512BW"],
4048
4048
  "_mm512_maskz_packs_epi16"=>["AVX512BW"],
4049
4049
  "_mm512_packs_epi16"=>["AVX512BW"],
4050
- "_mm_mask_packs_epi16"=>["AVX512VL", "AVX512BW"],
4051
- "_mm_maskz_packs_epi16"=>["AVX512VL", "AVX512BW"],
4052
- "_mm256_mask_packus_epi32"=>["AVX512VL", "AVX512BW"],
4053
- "_mm256_maskz_packus_epi32"=>["AVX512VL", "AVX512BW"],
4050
+ "_mm_mask_packs_epi16"=>[["AVX512VL", "AVX512BW"]],
4051
+ "_mm_maskz_packs_epi16"=>[["AVX512VL", "AVX512BW"]],
4052
+ "_mm256_mask_packus_epi32"=>[["AVX512VL", "AVX512BW"]],
4053
+ "_mm256_maskz_packus_epi32"=>[["AVX512VL", "AVX512BW"]],
4054
4054
  "_mm512_mask_packus_epi32"=>["AVX512BW"],
4055
4055
  "_mm512_maskz_packus_epi32"=>["AVX512BW"],
4056
4056
  "_mm512_packus_epi32"=>["AVX512BW"],
4057
- "_mm_mask_packus_epi32"=>["AVX512VL", "AVX512BW"],
4058
- "_mm_maskz_packus_epi32"=>["AVX512VL", "AVX512BW"],
4059
- "_mm256_mask_packus_epi16"=>["AVX512VL", "AVX512BW"],
4060
- "_mm256_maskz_packus_epi16"=>["AVX512VL", "AVX512BW"],
4057
+ "_mm_mask_packus_epi32"=>[["AVX512VL", "AVX512BW"]],
4058
+ "_mm_maskz_packus_epi32"=>[["AVX512VL", "AVX512BW"]],
4059
+ "_mm256_mask_packus_epi16"=>[["AVX512VL", "AVX512BW"]],
4060
+ "_mm256_maskz_packus_epi16"=>[["AVX512VL", "AVX512BW"]],
4061
4061
  "_mm512_mask_packus_epi16"=>["AVX512BW"],
4062
4062
  "_mm512_maskz_packus_epi16"=>["AVX512BW"],
4063
4063
  "_mm512_packus_epi16"=>["AVX512BW"],
4064
- "_mm_mask_packus_epi16"=>["AVX512VL", "AVX512BW"],
4065
- "_mm_maskz_packus_epi16"=>["AVX512VL", "AVX512BW"],
4066
- "_mm256_mask_add_epi8"=>["AVX512VL", "AVX512BW"],
4067
- "_mm256_maskz_add_epi8"=>["AVX512VL", "AVX512BW"],
4064
+ "_mm_mask_packus_epi16"=>[["AVX512VL", "AVX512BW"]],
4065
+ "_mm_maskz_packus_epi16"=>[["AVX512VL", "AVX512BW"]],
4066
+ "_mm256_mask_add_epi8"=>[["AVX512VL", "AVX512BW"]],
4067
+ "_mm256_maskz_add_epi8"=>[["AVX512VL", "AVX512BW"]],
4068
4068
  "_mm512_add_epi8"=>["AVX512BW"],
4069
4069
  "_mm512_mask_add_epi8"=>["AVX512BW"],
4070
4070
  "_mm512_maskz_add_epi8"=>["AVX512BW"],
4071
- "_mm_mask_add_epi8"=>["AVX512VL", "AVX512BW"],
4072
- "_mm_maskz_add_epi8"=>["AVX512VL", "AVX512BW"],
4073
- "_mm256_mask_add_epi32"=>["AVX512VL", "AVX512F"],
4074
- "_mm256_maskz_add_epi32"=>["AVX512VL", "AVX512F"],
4075
- "_mm_mask_add_epi32"=>["AVX512VL", "AVX512F"],
4076
- "_mm_maskz_add_epi32"=>["AVX512VL", "AVX512F"],
4077
- "_mm256_mask_add_epi64"=>["AVX512VL", "AVX512F"],
4078
- "_mm256_maskz_add_epi64"=>["AVX512VL", "AVX512F"],
4079
- "_mm_mask_add_epi64"=>["AVX512VL", "AVX512F"],
4080
- "_mm_maskz_add_epi64"=>["AVX512VL", "AVX512F"],
4081
- "_mm256_mask_adds_epi8"=>["AVX512VL", "AVX512BW"],
4082
- "_mm256_maskz_adds_epi8"=>["AVX512VL", "AVX512BW"],
4071
+ "_mm_mask_add_epi8"=>[["AVX512VL", "AVX512BW"]],
4072
+ "_mm_maskz_add_epi8"=>[["AVX512VL", "AVX512BW"]],
4073
+ "_mm256_mask_add_epi32"=>[["AVX512VL", "AVX512F"]],
4074
+ "_mm256_maskz_add_epi32"=>[["AVX512VL", "AVX512F"]],
4075
+ "_mm_mask_add_epi32"=>[["AVX512VL", "AVX512F"]],
4076
+ "_mm_maskz_add_epi32"=>[["AVX512VL", "AVX512F"]],
4077
+ "_mm256_mask_add_epi64"=>[["AVX512VL", "AVX512F"]],
4078
+ "_mm256_maskz_add_epi64"=>[["AVX512VL", "AVX512F"]],
4079
+ "_mm_mask_add_epi64"=>[["AVX512VL", "AVX512F"]],
4080
+ "_mm_maskz_add_epi64"=>[["AVX512VL", "AVX512F"]],
4081
+ "_mm256_mask_adds_epi8"=>[["AVX512VL", "AVX512BW"]],
4082
+ "_mm256_maskz_adds_epi8"=>[["AVX512VL", "AVX512BW"]],
4083
4083
  "_mm512_adds_epi8"=>["AVX512BW"],
4084
4084
  "_mm512_mask_adds_epi8"=>["AVX512BW"],
4085
4085
  "_mm512_maskz_adds_epi8"=>["AVX512BW"],
4086
- "_mm_mask_adds_epi8"=>["AVX512VL", "AVX512BW"],
4087
- "_mm_maskz_adds_epi8"=>["AVX512VL", "AVX512BW"],
4088
- "_mm256_mask_adds_epi16"=>["AVX512VL", "AVX512BW"],
4089
- "_mm256_maskz_adds_epi16"=>["AVX512VL", "AVX512BW"],
4086
+ "_mm_mask_adds_epi8"=>[["AVX512VL", "AVX512BW"]],
4087
+ "_mm_maskz_adds_epi8"=>[["AVX512VL", "AVX512BW"]],
4088
+ "_mm256_mask_adds_epi16"=>[["AVX512VL", "AVX512BW"]],
4089
+ "_mm256_maskz_adds_epi16"=>[["AVX512VL", "AVX512BW"]],
4090
4090
  "_mm512_adds_epi16"=>["AVX512BW"],
4091
4091
  "_mm512_mask_adds_epi16"=>["AVX512BW"],
4092
4092
  "_mm512_maskz_adds_epi16"=>["AVX512BW"],
4093
- "_mm_mask_adds_epi16"=>["AVX512VL", "AVX512BW"],
4094
- "_mm_maskz_adds_epi16"=>["AVX512VL", "AVX512BW"],
4095
- "_mm256_mask_adds_epu8"=>["AVX512VL", "AVX512BW"],
4096
- "_mm256_maskz_adds_epu8"=>["AVX512VL", "AVX512BW"],
4093
+ "_mm_mask_adds_epi16"=>[["AVX512VL", "AVX512BW"]],
4094
+ "_mm_maskz_adds_epi16"=>[["AVX512VL", "AVX512BW"]],
4095
+ "_mm256_mask_adds_epu8"=>[["AVX512VL", "AVX512BW"]],
4096
+ "_mm256_maskz_adds_epu8"=>[["AVX512VL", "AVX512BW"]],
4097
4097
  "_mm512_adds_epu8"=>["AVX512BW"],
4098
4098
  "_mm512_mask_adds_epu8"=>["AVX512BW"],
4099
4099
  "_mm512_maskz_adds_epu8"=>["AVX512BW"],
4100
- "_mm_mask_adds_epu8"=>["AVX512VL", "AVX512BW"],
4101
- "_mm_maskz_adds_epu8"=>["AVX512VL", "AVX512BW"],
4102
- "_mm256_mask_adds_epu16"=>["AVX512VL", "AVX512BW"],
4103
- "_mm256_maskz_adds_epu16"=>["AVX512VL", "AVX512BW"],
4100
+ "_mm_mask_adds_epu8"=>[["AVX512VL", "AVX512BW"]],
4101
+ "_mm_maskz_adds_epu8"=>[["AVX512VL", "AVX512BW"]],
4102
+ "_mm256_mask_adds_epu16"=>[["AVX512VL", "AVX512BW"]],
4103
+ "_mm256_maskz_adds_epu16"=>[["AVX512VL", "AVX512BW"]],
4104
4104
  "_mm512_adds_epu16"=>["AVX512BW"],
4105
4105
  "_mm512_mask_adds_epu16"=>["AVX512BW"],
4106
4106
  "_mm512_maskz_adds_epu16"=>["AVX512BW"],
4107
- "_mm_mask_adds_epu16"=>["AVX512VL", "AVX512BW"],
4108
- "_mm_maskz_adds_epu16"=>["AVX512VL", "AVX512BW"],
4109
- "_mm256_mask_add_epi16"=>["AVX512VL", "AVX512BW"],
4110
- "_mm256_maskz_add_epi16"=>["AVX512VL", "AVX512BW"],
4107
+ "_mm_mask_adds_epu16"=>[["AVX512VL", "AVX512BW"]],
4108
+ "_mm_maskz_adds_epu16"=>[["AVX512VL", "AVX512BW"]],
4109
+ "_mm256_mask_add_epi16"=>[["AVX512VL", "AVX512BW"]],
4110
+ "_mm256_maskz_add_epi16"=>[["AVX512VL", "AVX512BW"]],
4111
4111
  "_mm512_add_epi16"=>["AVX512BW"],
4112
4112
  "_mm512_mask_add_epi16"=>["AVX512BW"],
4113
4113
  "_mm512_maskz_add_epi16"=>["AVX512BW"],
4114
- "_mm_mask_add_epi16"=>["AVX512VL", "AVX512BW"],
4115
- "_mm_maskz_add_epi16"=>["AVX512VL", "AVX512BW"],
4116
- "_mm256_mask_alignr_epi8"=>["AVX512VL", "AVX512BW"],
4117
- "_mm256_maskz_alignr_epi8"=>["AVX512VL", "AVX512BW"],
4114
+ "_mm_mask_add_epi16"=>[["AVX512VL", "AVX512BW"]],
4115
+ "_mm_maskz_add_epi16"=>[["AVX512VL", "AVX512BW"]],
4116
+ "_mm256_mask_alignr_epi8"=>[["AVX512VL", "AVX512BW"]],
4117
+ "_mm256_maskz_alignr_epi8"=>[["AVX512VL", "AVX512BW"]],
4118
4118
  "_mm512_alignr_epi8"=>["AVX512BW"],
4119
4119
  "_mm512_mask_alignr_epi8"=>["AVX512BW"],
4120
4120
  "_mm512_maskz_alignr_epi8"=>["AVX512BW"],
4121
- "_mm_mask_alignr_epi8"=>["AVX512VL", "AVX512BW"],
4122
- "_mm_maskz_alignr_epi8"=>["AVX512VL", "AVX512BW"],
4123
- "_mm256_mask_and_epi32"=>["AVX512VL", "AVX512F"],
4124
- "_mm256_maskz_and_epi32"=>["AVX512VL", "AVX512F"],
4125
- "_mm_mask_and_epi32"=>["AVX512VL", "AVX512F"],
4126
- "_mm_maskz_and_epi32"=>["AVX512VL", "AVX512F"],
4127
- "_mm256_mask_andnot_epi32"=>["AVX512VL", "AVX512F"],
4128
- "_mm256_maskz_andnot_epi32"=>["AVX512VL", "AVX512F"],
4129
- "_mm_mask_andnot_epi32"=>["AVX512VL", "AVX512F"],
4130
- "_mm_maskz_andnot_epi32"=>["AVX512VL", "AVX512F"],
4131
- "_mm256_mask_andnot_epi64"=>["AVX512VL", "AVX512F"],
4132
- "_mm256_maskz_andnot_epi64"=>["AVX512VL", "AVX512F"],
4133
- "_mm_mask_andnot_epi64"=>["AVX512VL", "AVX512F"],
4134
- "_mm_maskz_andnot_epi64"=>["AVX512VL", "AVX512F"],
4135
- "_mm256_mask_and_epi64"=>["AVX512VL", "AVX512F"],
4136
- "_mm256_maskz_and_epi64"=>["AVX512VL", "AVX512F"],
4137
- "_mm_mask_and_epi64"=>["AVX512VL", "AVX512F"],
4138
- "_mm_maskz_and_epi64"=>["AVX512VL", "AVX512F"],
4139
- "_mm256_mask_avg_epu8"=>["AVX512VL", "AVX512BW"],
4140
- "_mm256_maskz_avg_epu8"=>["AVX512VL", "AVX512BW"],
4121
+ "_mm_mask_alignr_epi8"=>[["AVX512VL", "AVX512BW"]],
4122
+ "_mm_maskz_alignr_epi8"=>[["AVX512VL", "AVX512BW"]],
4123
+ "_mm256_mask_and_epi32"=>[["AVX512VL", "AVX512F"]],
4124
+ "_mm256_maskz_and_epi32"=>[["AVX512VL", "AVX512F"]],
4125
+ "_mm_mask_and_epi32"=>[["AVX512VL", "AVX512F"]],
4126
+ "_mm_maskz_and_epi32"=>[["AVX512VL", "AVX512F"]],
4127
+ "_mm256_mask_andnot_epi32"=>[["AVX512VL", "AVX512F"]],
4128
+ "_mm256_maskz_andnot_epi32"=>[["AVX512VL", "AVX512F"]],
4129
+ "_mm_mask_andnot_epi32"=>[["AVX512VL", "AVX512F"]],
4130
+ "_mm_maskz_andnot_epi32"=>[["AVX512VL", "AVX512F"]],
4131
+ "_mm256_mask_andnot_epi64"=>[["AVX512VL", "AVX512F"]],
4132
+ "_mm256_maskz_andnot_epi64"=>[["AVX512VL", "AVX512F"]],
4133
+ "_mm_mask_andnot_epi64"=>[["AVX512VL", "AVX512F"]],
4134
+ "_mm_maskz_andnot_epi64"=>[["AVX512VL", "AVX512F"]],
4135
+ "_mm256_mask_and_epi64"=>[["AVX512VL", "AVX512F"]],
4136
+ "_mm256_maskz_and_epi64"=>[["AVX512VL", "AVX512F"]],
4137
+ "_mm_mask_and_epi64"=>[["AVX512VL", "AVX512F"]],
4138
+ "_mm_maskz_and_epi64"=>[["AVX512VL", "AVX512F"]],
4139
+ "_mm256_mask_avg_epu8"=>[["AVX512VL", "AVX512BW"]],
4140
+ "_mm256_maskz_avg_epu8"=>[["AVX512VL", "AVX512BW"]],
4141
4141
  "_mm512_avg_epu8"=>["AVX512BW"],
4142
4142
  "_mm512_mask_avg_epu8"=>["AVX512BW"],
4143
4143
  "_mm512_maskz_avg_epu8"=>["AVX512BW"],
4144
- "_mm_mask_avg_epu8"=>["AVX512VL", "AVX512BW"],
4145
- "_mm_maskz_avg_epu8"=>["AVX512VL", "AVX512BW"],
4146
- "_mm256_mask_avg_epu16"=>["AVX512VL", "AVX512BW"],
4147
- "_mm256_maskz_avg_epu16"=>["AVX512VL", "AVX512BW"],
4144
+ "_mm_mask_avg_epu8"=>[["AVX512VL", "AVX512BW"]],
4145
+ "_mm_maskz_avg_epu8"=>[["AVX512VL", "AVX512BW"]],
4146
+ "_mm256_mask_avg_epu16"=>[["AVX512VL", "AVX512BW"]],
4147
+ "_mm256_maskz_avg_epu16"=>[["AVX512VL", "AVX512BW"]],
4148
4148
  "_mm512_avg_epu16"=>["AVX512BW"],
4149
4149
  "_mm512_mask_avg_epu16"=>["AVX512BW"],
4150
4150
  "_mm512_maskz_avg_epu16"=>["AVX512BW"],
4151
- "_mm_mask_avg_epu16"=>["AVX512VL", "AVX512BW"],
4152
- "_mm_maskz_avg_epu16"=>["AVX512VL", "AVX512BW"],
4153
- "_mm256_mask_blend_epi8"=>["AVX512VL", "AVX512BW"],
4151
+ "_mm_mask_avg_epu16"=>[["AVX512VL", "AVX512BW"]],
4152
+ "_mm_maskz_avg_epu16"=>[["AVX512VL", "AVX512BW"]],
4153
+ "_mm256_mask_blend_epi8"=>[["AVX512VL", "AVX512BW"]],
4154
4154
  "_mm512_mask_blend_epi8"=>["AVX512BW"],
4155
- "_mm_mask_blend_epi8"=>["AVX512VL", "AVX512BW"],
4156
- "_mm256_mask_blend_epi32"=>["AVX512VL", "AVX512F"],
4157
- "_mm_mask_blend_epi32"=>["AVX512VL", "AVX512F"],
4158
- "_mm256_mask_blend_epi64"=>["AVX512VL", "AVX512F"],
4159
- "_mm_mask_blend_epi64"=>["AVX512VL", "AVX512F"],
4160
- "_mm256_mask_blend_epi16"=>["AVX512VL", "AVX512BW"],
4155
+ "_mm_mask_blend_epi8"=>[["AVX512VL", "AVX512BW"]],
4156
+ "_mm256_mask_blend_epi32"=>[["AVX512VL", "AVX512F"]],
4157
+ "_mm_mask_blend_epi32"=>[["AVX512VL", "AVX512F"]],
4158
+ "_mm256_mask_blend_epi64"=>[["AVX512VL", "AVX512F"]],
4159
+ "_mm_mask_blend_epi64"=>[["AVX512VL", "AVX512F"]],
4160
+ "_mm256_mask_blend_epi16"=>[["AVX512VL", "AVX512BW"]],
4161
4161
  "_mm512_mask_blend_epi16"=>["AVX512BW"],
4162
- "_mm_mask_blend_epi16"=>["AVX512VL", "AVX512BW"],
4163
- "_mm256_mask_broadcastb_epi8"=>["AVX512VL", "AVX512BW"],
4164
- "_mm256_mask_set1_epi8"=>["AVX512VL", "AVX512BW"],
4165
- "_mm256_maskz_broadcastb_epi8"=>["AVX512VL", "AVX512BW"],
4166
- "_mm256_maskz_set1_epi8"=>["AVX512VL", "AVX512BW"],
4162
+ "_mm_mask_blend_epi16"=>[["AVX512VL", "AVX512BW"]],
4163
+ "_mm256_mask_broadcastb_epi8"=>[["AVX512VL", "AVX512BW"]],
4164
+ "_mm256_mask_set1_epi8"=>[["AVX512VL", "AVX512BW"]],
4165
+ "_mm256_maskz_broadcastb_epi8"=>[["AVX512VL", "AVX512BW"]],
4166
+ "_mm256_maskz_set1_epi8"=>[["AVX512VL", "AVX512BW"]],
4167
4167
  "_mm512_broadcastb_epi8"=>["AVX512BW"],
4168
4168
  "_mm512_mask_broadcastb_epi8"=>["AVX512BW"],
4169
4169
  "_mm512_mask_set1_epi8"=>["AVX512BW"],
4170
4170
  "_mm512_maskz_broadcastb_epi8"=>["AVX512BW"],
4171
4171
  "_mm512_maskz_set1_epi8"=>["AVX512BW"],
4172
- "_mm_mask_broadcastb_epi8"=>["AVX512VL", "AVX512BW"],
4173
- "_mm_mask_set1_epi8"=>["AVX512VL", "AVX512BW"],
4174
- "_mm_maskz_broadcastb_epi8"=>["AVX512VL", "AVX512BW"],
4175
- "_mm_maskz_set1_epi8"=>["AVX512VL", "AVX512BW"],
4176
- "_mm256_mask_broadcastd_epi32"=>["AVX512VL", "AVX512F"],
4177
- "_mm256_mask_set1_epi32"=>["AVX512VL", "AVX512F"],
4178
- "_mm256_maskz_broadcastd_epi32"=>["AVX512VL", "AVX512F"],
4179
- "_mm256_maskz_set1_epi32"=>["AVX512VL", "AVX512F"],
4180
- "_mm_mask_broadcastd_epi32"=>["AVX512VL", "AVX512F"],
4181
- "_mm_mask_set1_epi32"=>["AVX512VL", "AVX512F"],
4182
- "_mm_maskz_broadcastd_epi32"=>["AVX512VL", "AVX512F"],
4183
- "_mm_maskz_set1_epi32"=>["AVX512VL", "AVX512F"],
4184
- "_mm256_broadcastmb_epi64"=>["AVX512VL", "AVX512CD"],
4185
- "_mm_broadcastmb_epi64"=>["AVX512VL", "AVX512CD"],
4186
- "_mm256_broadcastmw_epi32"=>["AVX512VL", "AVX512CD"],
4187
- "_mm_broadcastmw_epi32"=>["AVX512VL", "AVX512CD"],
4188
- "_mm256_mask_broadcastq_epi64"=>["AVX512VL", "AVX512F"],
4189
- "_mm256_mask_set1_epi64"=>["AVX512VL", "AVX512F"],
4190
- "_mm256_maskz_broadcastq_epi64"=>["AVX512VL", "AVX512F"],
4191
- "_mm256_maskz_set1_epi64"=>["AVX512VL", "AVX512F"],
4192
- "_mm_mask_broadcastq_epi64"=>["AVX512VL", "AVX512F"],
4193
- "_mm_mask_set1_epi64"=>["AVX512VL", "AVX512F"],
4194
- "_mm_maskz_broadcastq_epi64"=>["AVX512VL", "AVX512F"],
4195
- "_mm_maskz_set1_epi64"=>["AVX512VL", "AVX512F"],
4196
- "_mm256_mask_broadcastw_epi16"=>["AVX512VL", "AVX512BW"],
4197
- "_mm256_mask_set1_epi16"=>["AVX512VL", "AVX512BW"],
4198
- "_mm256_maskz_broadcastw_epi16"=>["AVX512VL", "AVX512BW"],
4199
- "_mm256_maskz_set1_epi16"=>["AVX512VL", "AVX512BW"],
4172
+ "_mm_mask_broadcastb_epi8"=>[["AVX512VL", "AVX512BW"]],
4173
+ "_mm_mask_set1_epi8"=>[["AVX512VL", "AVX512BW"]],
4174
+ "_mm_maskz_broadcastb_epi8"=>[["AVX512VL", "AVX512BW"]],
4175
+ "_mm_maskz_set1_epi8"=>[["AVX512VL", "AVX512BW"]],
4176
+ "_mm256_mask_broadcastd_epi32"=>[["AVX512VL", "AVX512F"]],
4177
+ "_mm256_mask_set1_epi32"=>[["AVX512VL", "AVX512F"]],
4178
+ "_mm256_maskz_broadcastd_epi32"=>[["AVX512VL", "AVX512F"]],
4179
+ "_mm256_maskz_set1_epi32"=>[["AVX512VL", "AVX512F"]],
4180
+ "_mm_mask_broadcastd_epi32"=>[["AVX512VL", "AVX512F"]],
4181
+ "_mm_mask_set1_epi32"=>[["AVX512VL", "AVX512F"]],
4182
+ "_mm_maskz_broadcastd_epi32"=>[["AVX512VL", "AVX512F"]],
4183
+ "_mm_maskz_set1_epi32"=>[["AVX512VL", "AVX512F"]],
4184
+ "_mm256_broadcastmb_epi64"=>[["AVX512VL", "AVX512CD"]],
4185
+ "_mm_broadcastmb_epi64"=>[["AVX512VL", "AVX512CD"]],
4186
+ "_mm256_broadcastmw_epi32"=>[["AVX512VL", "AVX512CD"]],
4187
+ "_mm_broadcastmw_epi32"=>[["AVX512VL", "AVX512CD"]],
4188
+ "_mm256_mask_broadcastq_epi64"=>[["AVX512VL", "AVX512F"]],
4189
+ "_mm256_mask_set1_epi64"=>[["AVX512VL", "AVX512F"]],
4190
+ "_mm256_maskz_broadcastq_epi64"=>[["AVX512VL", "AVX512F"]],
4191
+ "_mm256_maskz_set1_epi64"=>[["AVX512VL", "AVX512F"]],
4192
+ "_mm_mask_broadcastq_epi64"=>[["AVX512VL", "AVX512F"]],
4193
+ "_mm_mask_set1_epi64"=>[["AVX512VL", "AVX512F"]],
4194
+ "_mm_maskz_broadcastq_epi64"=>[["AVX512VL", "AVX512F"]],
4195
+ "_mm_maskz_set1_epi64"=>[["AVX512VL", "AVX512F"]],
4196
+ "_mm256_mask_broadcastw_epi16"=>[["AVX512VL", "AVX512BW"]],
4197
+ "_mm256_mask_set1_epi16"=>[["AVX512VL", "AVX512BW"]],
4198
+ "_mm256_maskz_broadcastw_epi16"=>[["AVX512VL", "AVX512BW"]],
4199
+ "_mm256_maskz_set1_epi16"=>[["AVX512VL", "AVX512BW"]],
4200
4200
  "_mm512_broadcastw_epi16"=>["AVX512BW"],
4201
4201
  "_mm512_mask_broadcastw_epi16"=>["AVX512BW"],
4202
4202
  "_mm512_mask_set1_epi16"=>["AVX512BW"],
4203
4203
  "_mm512_maskz_broadcastw_epi16"=>["AVX512BW"],
4204
4204
  "_mm512_maskz_set1_epi16"=>["AVX512BW"],
4205
- "_mm_mask_broadcastw_epi16"=>["AVX512VL", "AVX512BW"],
4206
- "_mm_mask_set1_epi16"=>["AVX512VL", "AVX512BW"],
4207
- "_mm_maskz_broadcastw_epi16"=>["AVX512VL", "AVX512BW"],
4208
- "_mm_maskz_set1_epi16"=>["AVX512VL", "AVX512BW"],
4209
- "_mm256_cmp_epi8_mask"=>["AVX512VL", "AVX512BW"],
4210
- "_mm256_cmpeq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4211
- "_mm256_cmpge_epi8_mask"=>["AVX512VL", "AVX512BW"],
4212
- "_mm256_cmpgt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4213
- "_mm256_cmple_epi8_mask"=>["AVX512VL", "AVX512BW"],
4214
- "_mm256_cmplt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4215
- "_mm256_cmpneq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4216
- "_mm256_mask_cmp_epi8_mask"=>["AVX512VL", "AVX512BW"],
4217
- "_mm256_mask_cmpeq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4218
- "_mm256_mask_cmpge_epi8_mask"=>["AVX512VL", "AVX512BW"],
4219
- "_mm256_mask_cmpgt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4220
- "_mm256_mask_cmple_epi8_mask"=>["AVX512VL", "AVX512BW"],
4221
- "_mm256_mask_cmplt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4222
- "_mm256_mask_cmpneq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4205
+ "_mm_mask_broadcastw_epi16"=>[["AVX512VL", "AVX512BW"]],
4206
+ "_mm_mask_set1_epi16"=>[["AVX512VL", "AVX512BW"]],
4207
+ "_mm_maskz_broadcastw_epi16"=>[["AVX512VL", "AVX512BW"]],
4208
+ "_mm_maskz_set1_epi16"=>[["AVX512VL", "AVX512BW"]],
4209
+ "_mm256_cmp_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4210
+ "_mm256_cmpeq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4211
+ "_mm256_cmpge_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4212
+ "_mm256_cmpgt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4213
+ "_mm256_cmple_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4214
+ "_mm256_cmplt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4215
+ "_mm256_cmpneq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4216
+ "_mm256_mask_cmp_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4217
+ "_mm256_mask_cmpeq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4218
+ "_mm256_mask_cmpge_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4219
+ "_mm256_mask_cmpgt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4220
+ "_mm256_mask_cmple_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4221
+ "_mm256_mask_cmplt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4222
+ "_mm256_mask_cmpneq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4223
4223
  "_mm512_cmp_epi8_mask"=>["AVX512BW"],
4224
4224
  "_mm512_cmpeq_epi8_mask"=>["AVX512BW"],
4225
4225
  "_mm512_cmpge_epi8_mask"=>["AVX512BW"],
@@ -4234,90 +4234,90 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
4234
4234
  "_mm512_mask_cmple_epi8_mask"=>["AVX512BW"],
4235
4235
  "_mm512_mask_cmplt_epi8_mask"=>["AVX512BW"],
4236
4236
  "_mm512_mask_cmpneq_epi8_mask"=>["AVX512BW"],
4237
- "_mm_cmp_epi8_mask"=>["AVX512VL", "AVX512BW"],
4238
- "_mm_cmpeq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4239
- "_mm_cmpge_epi8_mask"=>["AVX512VL", "AVX512BW"],
4240
- "_mm_cmpgt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4241
- "_mm_cmple_epi8_mask"=>["AVX512VL", "AVX512BW"],
4242
- "_mm_cmplt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4243
- "_mm_cmpneq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4244
- "_mm_mask_cmp_epi8_mask"=>["AVX512VL", "AVX512BW"],
4245
- "_mm_mask_cmpeq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4246
- "_mm_mask_cmpge_epi8_mask"=>["AVX512VL", "AVX512BW"],
4247
- "_mm_mask_cmpgt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4248
- "_mm_mask_cmple_epi8_mask"=>["AVX512VL", "AVX512BW"],
4249
- "_mm_mask_cmplt_epi8_mask"=>["AVX512VL", "AVX512BW"],
4250
- "_mm_mask_cmpneq_epi8_mask"=>["AVX512VL", "AVX512BW"],
4251
- "_mm256_cmp_epi32_mask"=>["AVX512VL", "AVX512F"],
4252
- "_mm256_cmpeq_epi32_mask"=>["AVX512VL", "AVX512F"],
4253
- "_mm256_cmpge_epi32_mask"=>["AVX512VL", "AVX512F"],
4254
- "_mm256_cmpgt_epi32_mask"=>["AVX512VL", "AVX512F"],
4255
- "_mm256_cmple_epi32_mask"=>["AVX512VL", "AVX512F"],
4256
- "_mm256_cmplt_epi32_mask"=>["AVX512VL", "AVX512F"],
4257
- "_mm256_cmpneq_epi32_mask"=>["AVX512VL", "AVX512F"],
4258
- "_mm256_mask_cmp_epi32_mask"=>["AVX512VL", "AVX512F"],
4259
- "_mm256_mask_cmpeq_epi32_mask"=>["AVX512VL", "AVX512F"],
4260
- "_mm256_mask_cmpge_epi32_mask"=>["AVX512VL", "AVX512F"],
4261
- "_mm256_mask_cmpgt_epi32_mask"=>["AVX512VL", "AVX512F"],
4262
- "_mm256_mask_cmple_epi32_mask"=>["AVX512VL", "AVX512F"],
4263
- "_mm256_mask_cmplt_epi32_mask"=>["AVX512VL", "AVX512F"],
4264
- "_mm256_mask_cmpneq_epi32_mask"=>["AVX512VL", "AVX512F"],
4265
- "_mm_cmp_epi32_mask"=>["AVX512VL", "AVX512F"],
4266
- "_mm_cmpeq_epi32_mask"=>["AVX512VL", "AVX512F"],
4267
- "_mm_cmpge_epi32_mask"=>["AVX512VL", "AVX512F"],
4268
- "_mm_cmpgt_epi32_mask"=>["AVX512VL", "AVX512F"],
4269
- "_mm_cmple_epi32_mask"=>["AVX512VL", "AVX512F"],
4270
- "_mm_cmplt_epi32_mask"=>["AVX512VL", "AVX512F"],
4271
- "_mm_cmpneq_epi32_mask"=>["AVX512VL", "AVX512F"],
4272
- "_mm_mask_cmp_epi32_mask"=>["AVX512VL", "AVX512F"],
4273
- "_mm_mask_cmpeq_epi32_mask"=>["AVX512VL", "AVX512F"],
4274
- "_mm_mask_cmpge_epi32_mask"=>["AVX512VL", "AVX512F"],
4275
- "_mm_mask_cmpgt_epi32_mask"=>["AVX512VL", "AVX512F"],
4276
- "_mm_mask_cmple_epi32_mask"=>["AVX512VL", "AVX512F"],
4277
- "_mm_mask_cmplt_epi32_mask"=>["AVX512VL", "AVX512F"],
4278
- "_mm_mask_cmpneq_epi32_mask"=>["AVX512VL", "AVX512F"],
4279
- "_mm256_cmp_epi64_mask"=>["AVX512VL", "AVX512F"],
4280
- "_mm256_cmpeq_epi64_mask"=>["AVX512VL", "AVX512F"],
4281
- "_mm256_cmpge_epi64_mask"=>["AVX512VL", "AVX512F"],
4282
- "_mm256_cmpgt_epi64_mask"=>["AVX512VL", "AVX512F"],
4283
- "_mm256_cmple_epi64_mask"=>["AVX512VL", "AVX512F"],
4284
- "_mm256_cmplt_epi64_mask"=>["AVX512VL", "AVX512F"],
4285
- "_mm256_cmpneq_epi64_mask"=>["AVX512VL", "AVX512F"],
4286
- "_mm256_mask_cmp_epi64_mask"=>["AVX512VL", "AVX512F"],
4287
- "_mm256_mask_cmpeq_epi64_mask"=>["AVX512VL", "AVX512F"],
4288
- "_mm256_mask_cmpge_epi64_mask"=>["AVX512VL", "AVX512F"],
4289
- "_mm256_mask_cmpgt_epi64_mask"=>["AVX512VL", "AVX512F"],
4290
- "_mm256_mask_cmple_epi64_mask"=>["AVX512VL", "AVX512F"],
4291
- "_mm256_mask_cmplt_epi64_mask"=>["AVX512VL", "AVX512F"],
4292
- "_mm256_mask_cmpneq_epi64_mask"=>["AVX512VL", "AVX512F"],
4293
- "_mm_cmp_epi64_mask"=>["AVX512VL", "AVX512F"],
4294
- "_mm_cmpeq_epi64_mask"=>["AVX512VL", "AVX512F"],
4295
- "_mm_cmpge_epi64_mask"=>["AVX512VL", "AVX512F"],
4296
- "_mm_cmpgt_epi64_mask"=>["AVX512VL", "AVX512F"],
4297
- "_mm_cmple_epi64_mask"=>["AVX512VL", "AVX512F"],
4298
- "_mm_cmplt_epi64_mask"=>["AVX512VL", "AVX512F"],
4299
- "_mm_cmpneq_epi64_mask"=>["AVX512VL", "AVX512F"],
4300
- "_mm_mask_cmp_epi64_mask"=>["AVX512VL", "AVX512F"],
4301
- "_mm_mask_cmpeq_epi64_mask"=>["AVX512VL", "AVX512F"],
4302
- "_mm_mask_cmpge_epi64_mask"=>["AVX512VL", "AVX512F"],
4303
- "_mm_mask_cmpgt_epi64_mask"=>["AVX512VL", "AVX512F"],
4304
- "_mm_mask_cmple_epi64_mask"=>["AVX512VL", "AVX512F"],
4305
- "_mm_mask_cmplt_epi64_mask"=>["AVX512VL", "AVX512F"],
4306
- "_mm_mask_cmpneq_epi64_mask"=>["AVX512VL", "AVX512F"],
4307
- "_mm256_cmp_epu8_mask"=>["AVX512VL", "AVX512BW"],
4308
- "_mm256_cmpeq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4309
- "_mm256_cmpge_epu8_mask"=>["AVX512VL", "AVX512BW"],
4310
- "_mm256_cmpgt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4311
- "_mm256_cmple_epu8_mask"=>["AVX512VL", "AVX512BW"],
4312
- "_mm256_cmplt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4313
- "_mm256_cmpneq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4314
- "_mm256_mask_cmp_epu8_mask"=>["AVX512VL", "AVX512BW"],
4315
- "_mm256_mask_cmpeq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4316
- "_mm256_mask_cmpge_epu8_mask"=>["AVX512VL", "AVX512BW"],
4317
- "_mm256_mask_cmpgt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4318
- "_mm256_mask_cmple_epu8_mask"=>["AVX512VL", "AVX512BW"],
4319
- "_mm256_mask_cmplt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4320
- "_mm256_mask_cmpneq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4237
+ "_mm_cmp_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4238
+ "_mm_cmpeq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4239
+ "_mm_cmpge_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4240
+ "_mm_cmpgt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4241
+ "_mm_cmple_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4242
+ "_mm_cmplt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4243
+ "_mm_cmpneq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4244
+ "_mm_mask_cmp_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4245
+ "_mm_mask_cmpeq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4246
+ "_mm_mask_cmpge_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4247
+ "_mm_mask_cmpgt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4248
+ "_mm_mask_cmple_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4249
+ "_mm_mask_cmplt_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4250
+ "_mm_mask_cmpneq_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
4251
+ "_mm256_cmp_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4252
+ "_mm256_cmpeq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4253
+ "_mm256_cmpge_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4254
+ "_mm256_cmpgt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4255
+ "_mm256_cmple_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4256
+ "_mm256_cmplt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4257
+ "_mm256_cmpneq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4258
+ "_mm256_mask_cmp_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4259
+ "_mm256_mask_cmpeq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4260
+ "_mm256_mask_cmpge_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4261
+ "_mm256_mask_cmpgt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4262
+ "_mm256_mask_cmple_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4263
+ "_mm256_mask_cmplt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4264
+ "_mm256_mask_cmpneq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4265
+ "_mm_cmp_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4266
+ "_mm_cmpeq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4267
+ "_mm_cmpge_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4268
+ "_mm_cmpgt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4269
+ "_mm_cmple_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4270
+ "_mm_cmplt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4271
+ "_mm_cmpneq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4272
+ "_mm_mask_cmp_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4273
+ "_mm_mask_cmpeq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4274
+ "_mm_mask_cmpge_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4275
+ "_mm_mask_cmpgt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4276
+ "_mm_mask_cmple_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4277
+ "_mm_mask_cmplt_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4278
+ "_mm_mask_cmpneq_epi32_mask"=>[["AVX512VL", "AVX512F"]],
4279
+ "_mm256_cmp_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4280
+ "_mm256_cmpeq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4281
+ "_mm256_cmpge_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4282
+ "_mm256_cmpgt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4283
+ "_mm256_cmple_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4284
+ "_mm256_cmplt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4285
+ "_mm256_cmpneq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4286
+ "_mm256_mask_cmp_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4287
+ "_mm256_mask_cmpeq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4288
+ "_mm256_mask_cmpge_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4289
+ "_mm256_mask_cmpgt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4290
+ "_mm256_mask_cmple_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4291
+ "_mm256_mask_cmplt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4292
+ "_mm256_mask_cmpneq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4293
+ "_mm_cmp_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4294
+ "_mm_cmpeq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4295
+ "_mm_cmpge_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4296
+ "_mm_cmpgt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4297
+ "_mm_cmple_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4298
+ "_mm_cmplt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4299
+ "_mm_cmpneq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4300
+ "_mm_mask_cmp_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4301
+ "_mm_mask_cmpeq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4302
+ "_mm_mask_cmpge_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4303
+ "_mm_mask_cmpgt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4304
+ "_mm_mask_cmple_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4305
+ "_mm_mask_cmplt_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4306
+ "_mm_mask_cmpneq_epi64_mask"=>[["AVX512VL", "AVX512F"]],
4307
+ "_mm256_cmp_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4308
+ "_mm256_cmpeq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4309
+ "_mm256_cmpge_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4310
+ "_mm256_cmpgt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4311
+ "_mm256_cmple_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4312
+ "_mm256_cmplt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4313
+ "_mm256_cmpneq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4314
+ "_mm256_mask_cmp_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4315
+ "_mm256_mask_cmpeq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4316
+ "_mm256_mask_cmpge_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4317
+ "_mm256_mask_cmpgt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4318
+ "_mm256_mask_cmple_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4319
+ "_mm256_mask_cmplt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4320
+ "_mm256_mask_cmpneq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4321
4321
  "_mm512_cmp_epu8_mask"=>["AVX512BW"],
4322
4322
  "_mm512_cmpeq_epu8_mask"=>["AVX512BW"],
4323
4323
  "_mm512_cmpge_epu8_mask"=>["AVX512BW"],
@@ -4332,90 +4332,90 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
4332
4332
  "_mm512_mask_cmple_epu8_mask"=>["AVX512BW"],
4333
4333
  "_mm512_mask_cmplt_epu8_mask"=>["AVX512BW"],
4334
4334
  "_mm512_mask_cmpneq_epu8_mask"=>["AVX512BW"],
4335
- "_mm_cmp_epu8_mask"=>["AVX512VL", "AVX512BW"],
4336
- "_mm_cmpeq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4337
- "_mm_cmpge_epu8_mask"=>["AVX512VL", "AVX512BW"],
4338
- "_mm_cmpgt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4339
- "_mm_cmple_epu8_mask"=>["AVX512VL", "AVX512BW"],
4340
- "_mm_cmplt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4341
- "_mm_cmpneq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4342
- "_mm_mask_cmp_epu8_mask"=>["AVX512VL", "AVX512BW"],
4343
- "_mm_mask_cmpeq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4344
- "_mm_mask_cmpge_epu8_mask"=>["AVX512VL", "AVX512BW"],
4345
- "_mm_mask_cmpgt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4346
- "_mm_mask_cmple_epu8_mask"=>["AVX512VL", "AVX512BW"],
4347
- "_mm_mask_cmplt_epu8_mask"=>["AVX512VL", "AVX512BW"],
4348
- "_mm_mask_cmpneq_epu8_mask"=>["AVX512VL", "AVX512BW"],
4349
- "_mm256_cmp_epu32_mask"=>["AVX512VL", "AVX512F"],
4350
- "_mm256_cmpeq_epu32_mask"=>["AVX512VL", "AVX512F"],
4351
- "_mm256_cmpge_epu32_mask"=>["AVX512VL", "AVX512F"],
4352
- "_mm256_cmpgt_epu32_mask"=>["AVX512VL", "AVX512F"],
4353
- "_mm256_cmple_epu32_mask"=>["AVX512VL", "AVX512F"],
4354
- "_mm256_cmplt_epu32_mask"=>["AVX512VL", "AVX512F"],
4355
- "_mm256_cmpneq_epu32_mask"=>["AVX512VL", "AVX512F"],
4356
- "_mm256_mask_cmp_epu32_mask"=>["AVX512VL", "AVX512F"],
4357
- "_mm256_mask_cmpeq_epu32_mask"=>["AVX512VL", "AVX512F"],
4358
- "_mm256_mask_cmpge_epu32_mask"=>["AVX512VL", "AVX512F"],
4359
- "_mm256_mask_cmpgt_epu32_mask"=>["AVX512VL", "AVX512F"],
4360
- "_mm256_mask_cmple_epu32_mask"=>["AVX512VL", "AVX512F"],
4361
- "_mm256_mask_cmplt_epu32_mask"=>["AVX512VL", "AVX512F"],
4362
- "_mm256_mask_cmpneq_epu32_mask"=>["AVX512VL", "AVX512F"],
4363
- "_mm_cmp_epu32_mask"=>["AVX512VL", "AVX512F"],
4364
- "_mm_cmpeq_epu32_mask"=>["AVX512VL", "AVX512F"],
4365
- "_mm_cmpge_epu32_mask"=>["AVX512VL", "AVX512F"],
4366
- "_mm_cmpgt_epu32_mask"=>["AVX512VL", "AVX512F"],
4367
- "_mm_cmple_epu32_mask"=>["AVX512VL", "AVX512F"],
4368
- "_mm_cmplt_epu32_mask"=>["AVX512VL", "AVX512F"],
4369
- "_mm_cmpneq_epu32_mask"=>["AVX512VL", "AVX512F"],
4370
- "_mm_mask_cmp_epu32_mask"=>["AVX512VL", "AVX512F"],
4371
- "_mm_mask_cmpeq_epu32_mask"=>["AVX512VL", "AVX512F"],
4372
- "_mm_mask_cmpge_epu32_mask"=>["AVX512VL", "AVX512F"],
4373
- "_mm_mask_cmpgt_epu32_mask"=>["AVX512VL", "AVX512F"],
4374
- "_mm_mask_cmple_epu32_mask"=>["AVX512VL", "AVX512F"],
4375
- "_mm_mask_cmplt_epu32_mask"=>["AVX512VL", "AVX512F"],
4376
- "_mm_mask_cmpneq_epu32_mask"=>["AVX512VL", "AVX512F"],
4377
- "_mm256_cmp_epu64_mask"=>["AVX512VL", "AVX512F"],
4378
- "_mm256_cmpeq_epu64_mask"=>["AVX512VL", "AVX512F"],
4379
- "_mm256_cmpge_epu64_mask"=>["AVX512VL", "AVX512F"],
4380
- "_mm256_cmpgt_epu64_mask"=>["AVX512VL", "AVX512F"],
4381
- "_mm256_cmple_epu64_mask"=>["AVX512VL", "AVX512F"],
4382
- "_mm256_cmplt_epu64_mask"=>["AVX512VL", "AVX512F"],
4383
- "_mm256_cmpneq_epu64_mask"=>["AVX512VL", "AVX512F"],
4384
- "_mm256_mask_cmp_epu64_mask"=>["AVX512VL", "AVX512F"],
4385
- "_mm256_mask_cmpeq_epu64_mask"=>["AVX512VL", "AVX512F"],
4386
- "_mm256_mask_cmpge_epu64_mask"=>["AVX512VL", "AVX512F"],
4387
- "_mm256_mask_cmpgt_epu64_mask"=>["AVX512VL", "AVX512F"],
4388
- "_mm256_mask_cmple_epu64_mask"=>["AVX512VL", "AVX512F"],
4389
- "_mm256_mask_cmplt_epu64_mask"=>["AVX512VL", "AVX512F"],
4390
- "_mm256_mask_cmpneq_epu64_mask"=>["AVX512VL", "AVX512F"],
4391
- "_mm_cmp_epu64_mask"=>["AVX512VL", "AVX512F"],
4392
- "_mm_cmpeq_epu64_mask"=>["AVX512VL", "AVX512F"],
4393
- "_mm_cmpge_epu64_mask"=>["AVX512VL", "AVX512F"],
4394
- "_mm_cmpgt_epu64_mask"=>["AVX512VL", "AVX512F"],
4395
- "_mm_cmple_epu64_mask"=>["AVX512VL", "AVX512F"],
4396
- "_mm_cmplt_epu64_mask"=>["AVX512VL", "AVX512F"],
4397
- "_mm_cmpneq_epu64_mask"=>["AVX512VL", "AVX512F"],
4398
- "_mm_mask_cmp_epu64_mask"=>["AVX512VL", "AVX512F"],
4399
- "_mm_mask_cmpeq_epu64_mask"=>["AVX512VL", "AVX512F"],
4400
- "_mm_mask_cmpge_epu64_mask"=>["AVX512VL", "AVX512F"],
4401
- "_mm_mask_cmpgt_epu64_mask"=>["AVX512VL", "AVX512F"],
4402
- "_mm_mask_cmple_epu64_mask"=>["AVX512VL", "AVX512F"],
4403
- "_mm_mask_cmplt_epu64_mask"=>["AVX512VL", "AVX512F"],
4404
- "_mm_mask_cmpneq_epu64_mask"=>["AVX512VL", "AVX512F"],
4405
- "_mm256_cmp_epu16_mask"=>["AVX512VL", "AVX512BW"],
4406
- "_mm256_cmpeq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4407
- "_mm256_cmpge_epu16_mask"=>["AVX512VL", "AVX512BW"],
4408
- "_mm256_cmpgt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4409
- "_mm256_cmple_epu16_mask"=>["AVX512VL", "AVX512BW"],
4410
- "_mm256_cmplt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4411
- "_mm256_cmpneq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4412
- "_mm256_mask_cmp_epu16_mask"=>["AVX512VL", "AVX512BW"],
4413
- "_mm256_mask_cmpeq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4414
- "_mm256_mask_cmpge_epu16_mask"=>["AVX512VL", "AVX512BW"],
4415
- "_mm256_mask_cmpgt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4416
- "_mm256_mask_cmple_epu16_mask"=>["AVX512VL", "AVX512BW"],
4417
- "_mm256_mask_cmplt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4418
- "_mm256_mask_cmpneq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4335
+ "_mm_cmp_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4336
+ "_mm_cmpeq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4337
+ "_mm_cmpge_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4338
+ "_mm_cmpgt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4339
+ "_mm_cmple_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4340
+ "_mm_cmplt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4341
+ "_mm_cmpneq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4342
+ "_mm_mask_cmp_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4343
+ "_mm_mask_cmpeq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4344
+ "_mm_mask_cmpge_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4345
+ "_mm_mask_cmpgt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4346
+ "_mm_mask_cmple_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4347
+ "_mm_mask_cmplt_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4348
+ "_mm_mask_cmpneq_epu8_mask"=>[["AVX512VL", "AVX512BW"]],
4349
+ "_mm256_cmp_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4350
+ "_mm256_cmpeq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4351
+ "_mm256_cmpge_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4352
+ "_mm256_cmpgt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4353
+ "_mm256_cmple_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4354
+ "_mm256_cmplt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4355
+ "_mm256_cmpneq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4356
+ "_mm256_mask_cmp_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4357
+ "_mm256_mask_cmpeq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4358
+ "_mm256_mask_cmpge_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4359
+ "_mm256_mask_cmpgt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4360
+ "_mm256_mask_cmple_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4361
+ "_mm256_mask_cmplt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4362
+ "_mm256_mask_cmpneq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4363
+ "_mm_cmp_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4364
+ "_mm_cmpeq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4365
+ "_mm_cmpge_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4366
+ "_mm_cmpgt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4367
+ "_mm_cmple_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4368
+ "_mm_cmplt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4369
+ "_mm_cmpneq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4370
+ "_mm_mask_cmp_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4371
+ "_mm_mask_cmpeq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4372
+ "_mm_mask_cmpge_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4373
+ "_mm_mask_cmpgt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4374
+ "_mm_mask_cmple_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4375
+ "_mm_mask_cmplt_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4376
+ "_mm_mask_cmpneq_epu32_mask"=>[["AVX512VL", "AVX512F"]],
4377
+ "_mm256_cmp_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4378
+ "_mm256_cmpeq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4379
+ "_mm256_cmpge_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4380
+ "_mm256_cmpgt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4381
+ "_mm256_cmple_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4382
+ "_mm256_cmplt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4383
+ "_mm256_cmpneq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4384
+ "_mm256_mask_cmp_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4385
+ "_mm256_mask_cmpeq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4386
+ "_mm256_mask_cmpge_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4387
+ "_mm256_mask_cmpgt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4388
+ "_mm256_mask_cmple_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4389
+ "_mm256_mask_cmplt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4390
+ "_mm256_mask_cmpneq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4391
+ "_mm_cmp_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4392
+ "_mm_cmpeq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4393
+ "_mm_cmpge_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4394
+ "_mm_cmpgt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4395
+ "_mm_cmple_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4396
+ "_mm_cmplt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4397
+ "_mm_cmpneq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4398
+ "_mm_mask_cmp_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4399
+ "_mm_mask_cmpeq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4400
+ "_mm_mask_cmpge_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4401
+ "_mm_mask_cmpgt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4402
+ "_mm_mask_cmple_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4403
+ "_mm_mask_cmplt_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4404
+ "_mm_mask_cmpneq_epu64_mask"=>[["AVX512VL", "AVX512F"]],
4405
+ "_mm256_cmp_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4406
+ "_mm256_cmpeq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4407
+ "_mm256_cmpge_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4408
+ "_mm256_cmpgt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4409
+ "_mm256_cmple_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4410
+ "_mm256_cmplt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4411
+ "_mm256_cmpneq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4412
+ "_mm256_mask_cmp_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4413
+ "_mm256_mask_cmpeq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4414
+ "_mm256_mask_cmpge_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4415
+ "_mm256_mask_cmpgt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4416
+ "_mm256_mask_cmple_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4417
+ "_mm256_mask_cmplt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4418
+ "_mm256_mask_cmpneq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4419
4419
  "_mm512_cmp_epu16_mask"=>["AVX512BW"],
4420
4420
  "_mm512_cmpeq_epu16_mask"=>["AVX512BW"],
4421
4421
  "_mm512_cmpge_epu16_mask"=>["AVX512BW"],
@@ -4430,34 +4430,34 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
4430
4430
  "_mm512_mask_cmple_epu16_mask"=>["AVX512BW"],
4431
4431
  "_mm512_mask_cmplt_epu16_mask"=>["AVX512BW"],
4432
4432
  "_mm512_mask_cmpneq_epu16_mask"=>["AVX512BW"],
4433
- "_mm_cmp_epu16_mask"=>["AVX512VL", "AVX512BW"],
4434
- "_mm_cmpeq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4435
- "_mm_cmpge_epu16_mask"=>["AVX512VL", "AVX512BW"],
4436
- "_mm_cmpgt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4437
- "_mm_cmple_epu16_mask"=>["AVX512VL", "AVX512BW"],
4438
- "_mm_cmplt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4439
- "_mm_cmpneq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4440
- "_mm_mask_cmp_epu16_mask"=>["AVX512VL", "AVX512BW"],
4441
- "_mm_mask_cmpeq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4442
- "_mm_mask_cmpge_epu16_mask"=>["AVX512VL", "AVX512BW"],
4443
- "_mm_mask_cmpgt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4444
- "_mm_mask_cmple_epu16_mask"=>["AVX512VL", "AVX512BW"],
4445
- "_mm_mask_cmplt_epu16_mask"=>["AVX512VL", "AVX512BW"],
4446
- "_mm_mask_cmpneq_epu16_mask"=>["AVX512VL", "AVX512BW"],
4447
- "_mm256_cmp_epi16_mask"=>["AVX512VL", "AVX512BW"],
4448
- "_mm256_cmpeq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4449
- "_mm256_cmpge_epi16_mask"=>["AVX512VL", "AVX512BW"],
4450
- "_mm256_cmpgt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4451
- "_mm256_cmple_epi16_mask"=>["AVX512VL", "AVX512BW"],
4452
- "_mm256_cmplt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4453
- "_mm256_cmpneq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4454
- "_mm256_mask_cmp_epi16_mask"=>["AVX512VL", "AVX512BW"],
4455
- "_mm256_mask_cmpeq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4456
- "_mm256_mask_cmpge_epi16_mask"=>["AVX512VL", "AVX512BW"],
4457
- "_mm256_mask_cmpgt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4458
- "_mm256_mask_cmple_epi16_mask"=>["AVX512VL", "AVX512BW"],
4459
- "_mm256_mask_cmplt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4460
- "_mm256_mask_cmpneq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4433
+ "_mm_cmp_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4434
+ "_mm_cmpeq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4435
+ "_mm_cmpge_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4436
+ "_mm_cmpgt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4437
+ "_mm_cmple_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4438
+ "_mm_cmplt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4439
+ "_mm_cmpneq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4440
+ "_mm_mask_cmp_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4441
+ "_mm_mask_cmpeq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4442
+ "_mm_mask_cmpge_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4443
+ "_mm_mask_cmpgt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4444
+ "_mm_mask_cmple_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4445
+ "_mm_mask_cmplt_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4446
+ "_mm_mask_cmpneq_epu16_mask"=>[["AVX512VL", "AVX512BW"]],
4447
+ "_mm256_cmp_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4448
+ "_mm256_cmpeq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4449
+ "_mm256_cmpge_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4450
+ "_mm256_cmpgt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4451
+ "_mm256_cmple_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4452
+ "_mm256_cmplt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4453
+ "_mm256_cmpneq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4454
+ "_mm256_mask_cmp_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4455
+ "_mm256_mask_cmpeq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4456
+ "_mm256_mask_cmpge_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4457
+ "_mm256_mask_cmpgt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4458
+ "_mm256_mask_cmple_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4459
+ "_mm256_mask_cmplt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4460
+ "_mm256_mask_cmpneq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4461
4461
  "_mm512_cmp_epi16_mask"=>["AVX512BW"],
4462
4462
  "_mm512_cmpeq_epi16_mask"=>["AVX512BW"],
4463
4463
  "_mm512_cmpge_epi16_mask"=>["AVX512BW"],
@@ -4472,986 +4472,986 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
4472
4472
  "_mm512_mask_cmple_epi16_mask"=>["AVX512BW"],
4473
4473
  "_mm512_mask_cmplt_epi16_mask"=>["AVX512BW"],
4474
4474
  "_mm512_mask_cmpneq_epi16_mask"=>["AVX512BW"],
4475
- "_mm_cmp_epi16_mask"=>["AVX512VL", "AVX512BW"],
4476
- "_mm_cmpeq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4477
- "_mm_cmpge_epi16_mask"=>["AVX512VL", "AVX512BW"],
4478
- "_mm_cmpgt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4479
- "_mm_cmple_epi16_mask"=>["AVX512VL", "AVX512BW"],
4480
- "_mm_cmplt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4481
- "_mm_cmpneq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4482
- "_mm_mask_cmp_epi16_mask"=>["AVX512VL", "AVX512BW"],
4483
- "_mm_mask_cmpeq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4484
- "_mm_mask_cmpge_epi16_mask"=>["AVX512VL", "AVX512BW"],
4485
- "_mm_mask_cmpgt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4486
- "_mm_mask_cmple_epi16_mask"=>["AVX512VL", "AVX512BW"],
4487
- "_mm_mask_cmplt_epi16_mask"=>["AVX512VL", "AVX512BW"],
4488
- "_mm_mask_cmpneq_epi16_mask"=>["AVX512VL", "AVX512BW"],
4489
- "_mm256_mask_compress_epi32"=>["AVX512VL", "AVX512F"],
4490
- "_mm256_mask_compressstoreu_epi32"=>["AVX512VL", "AVX512F"],
4491
- "_mm256_maskz_compress_epi32"=>["AVX512VL", "AVX512F"],
4492
- "_mm_mask_compress_epi32"=>["AVX512VL", "AVX512F"],
4493
- "_mm_mask_compressstoreu_epi32"=>["AVX512VL", "AVX512F"],
4494
- "_mm_maskz_compress_epi32"=>["AVX512VL", "AVX512F"],
4495
- "_mm256_mask_compress_epi64"=>["AVX512VL", "AVX512F"],
4496
- "_mm256_mask_compressstoreu_epi64"=>["AVX512VL", "AVX512F"],
4497
- "_mm256_maskz_compress_epi64"=>["AVX512VL", "AVX512F"],
4498
- "_mm_mask_compress_epi64"=>["AVX512VL", "AVX512F"],
4499
- "_mm_mask_compressstoreu_epi64"=>["AVX512VL", "AVX512F"],
4500
- "_mm_maskz_compress_epi64"=>["AVX512VL", "AVX512F"],
4501
- "_mm256_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4502
- "_mm256_mask_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4503
- "_mm256_maskz_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4504
- "_mm_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4505
- "_mm_mask_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4506
- "_mm_maskz_conflict_epi32"=>["AVX512VL", "AVX512CD"],
4507
- "_mm256_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4508
- "_mm256_mask_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4509
- "_mm256_maskz_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4510
- "_mm_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4511
- "_mm_mask_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4512
- "_mm_maskz_conflict_epi64"=>["AVX512VL", "AVX512CD"],
4513
- "_mm256_mask_permutexvar_epi32"=>["AVX512VL", "AVX512F"],
4514
- "_mm256_maskz_permutexvar_epi32"=>["AVX512VL", "AVX512F"],
4515
- "_mm256_permutexvar_epi32"=>["AVX512VL", "AVX512F"],
4516
- "_mm256_mask2_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4517
- "_mm256_mask_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4518
- "_mm256_maskz_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4519
- "_mm256_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4520
- "_mm_mask2_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4521
- "_mm_mask_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4522
- "_mm_maskz_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4523
- "_mm_permutex2var_epi32"=>["AVX512VL", "AVX512F"],
4524
- "_mm256_mask2_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4525
- "_mm256_mask_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4526
- "_mm256_maskz_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4527
- "_mm256_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4528
- "_mm_mask2_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4529
- "_mm_mask_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4530
- "_mm_maskz_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4531
- "_mm_permutex2var_pd"=>["AVX512VL", "AVX512F"],
4532
- "_mm256_mask2_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4533
- "_mm256_mask_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4534
- "_mm256_maskz_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4535
- "_mm256_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4536
- "_mm_mask2_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4537
- "_mm_mask_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4538
- "_mm_maskz_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4539
- "_mm_permutex2var_ps"=>["AVX512VL", "AVX512F"],
4540
- "_mm256_mask2_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4541
- "_mm256_mask_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4542
- "_mm256_maskz_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4543
- "_mm256_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4544
- "_mm_mask2_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4545
- "_mm_mask_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4546
- "_mm_maskz_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4547
- "_mm_permutex2var_epi64"=>["AVX512VL", "AVX512F"],
4548
- "_mm256_mask2_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4549
- "_mm256_mask_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4550
- "_mm256_maskz_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4551
- "_mm256_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4475
+ "_mm_cmp_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4476
+ "_mm_cmpeq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4477
+ "_mm_cmpge_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4478
+ "_mm_cmpgt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4479
+ "_mm_cmple_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4480
+ "_mm_cmplt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4481
+ "_mm_cmpneq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4482
+ "_mm_mask_cmp_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4483
+ "_mm_mask_cmpeq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4484
+ "_mm_mask_cmpge_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4485
+ "_mm_mask_cmpgt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4486
+ "_mm_mask_cmple_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4487
+ "_mm_mask_cmplt_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4488
+ "_mm_mask_cmpneq_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
4489
+ "_mm256_mask_compress_epi32"=>[["AVX512VL", "AVX512F"]],
4490
+ "_mm256_mask_compressstoreu_epi32"=>[["AVX512VL", "AVX512F"]],
4491
+ "_mm256_maskz_compress_epi32"=>[["AVX512VL", "AVX512F"]],
4492
+ "_mm_mask_compress_epi32"=>[["AVX512VL", "AVX512F"]],
4493
+ "_mm_mask_compressstoreu_epi32"=>[["AVX512VL", "AVX512F"]],
4494
+ "_mm_maskz_compress_epi32"=>[["AVX512VL", "AVX512F"]],
4495
+ "_mm256_mask_compress_epi64"=>[["AVX512VL", "AVX512F"]],
4496
+ "_mm256_mask_compressstoreu_epi64"=>[["AVX512VL", "AVX512F"]],
4497
+ "_mm256_maskz_compress_epi64"=>[["AVX512VL", "AVX512F"]],
4498
+ "_mm_mask_compress_epi64"=>[["AVX512VL", "AVX512F"]],
4499
+ "_mm_mask_compressstoreu_epi64"=>[["AVX512VL", "AVX512F"]],
4500
+ "_mm_maskz_compress_epi64"=>[["AVX512VL", "AVX512F"]],
4501
+ "_mm256_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4502
+ "_mm256_mask_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4503
+ "_mm256_maskz_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4504
+ "_mm_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4505
+ "_mm_mask_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4506
+ "_mm_maskz_conflict_epi32"=>[["AVX512VL", "AVX512CD"]],
4507
+ "_mm256_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4508
+ "_mm256_mask_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4509
+ "_mm256_maskz_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4510
+ "_mm_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4511
+ "_mm_mask_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4512
+ "_mm_maskz_conflict_epi64"=>[["AVX512VL", "AVX512CD"]],
4513
+ "_mm256_mask_permutexvar_epi32"=>[["AVX512VL", "AVX512F"]],
4514
+ "_mm256_maskz_permutexvar_epi32"=>[["AVX512VL", "AVX512F"]],
4515
+ "_mm256_permutexvar_epi32"=>[["AVX512VL", "AVX512F"]],
4516
+ "_mm256_mask2_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4517
+ "_mm256_mask_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4518
+ "_mm256_maskz_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4519
+ "_mm256_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4520
+ "_mm_mask2_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4521
+ "_mm_mask_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4522
+ "_mm_maskz_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4523
+ "_mm_permutex2var_epi32"=>[["AVX512VL", "AVX512F"]],
4524
+ "_mm256_mask2_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4525
+ "_mm256_mask_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4526
+ "_mm256_maskz_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4527
+ "_mm256_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4528
+ "_mm_mask2_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4529
+ "_mm_mask_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4530
+ "_mm_maskz_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4531
+ "_mm_permutex2var_pd"=>[["AVX512VL", "AVX512F"]],
4532
+ "_mm256_mask2_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4533
+ "_mm256_mask_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4534
+ "_mm256_maskz_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4535
+ "_mm256_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4536
+ "_mm_mask2_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4537
+ "_mm_mask_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4538
+ "_mm_maskz_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4539
+ "_mm_permutex2var_ps"=>[["AVX512VL", "AVX512F"]],
4540
+ "_mm256_mask2_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4541
+ "_mm256_mask_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4542
+ "_mm256_maskz_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4543
+ "_mm256_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4544
+ "_mm_mask2_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4545
+ "_mm_mask_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4546
+ "_mm_maskz_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4547
+ "_mm_permutex2var_epi64"=>[["AVX512VL", "AVX512F"]],
4548
+ "_mm256_mask2_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4549
+ "_mm256_mask_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4550
+ "_mm256_maskz_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4551
+ "_mm256_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4552
4552
  "_mm512_mask2_permutex2var_epi16"=>["AVX512BW"],
4553
4553
  "_mm512_mask_permutex2var_epi16"=>["AVX512BW"],
4554
4554
  "_mm512_maskz_permutex2var_epi16"=>["AVX512BW"],
4555
4555
  "_mm512_permutex2var_epi16"=>["AVX512BW"],
4556
- "_mm_mask2_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4557
- "_mm_mask_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4558
- "_mm_maskz_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4559
- "_mm_permutex2var_epi16"=>["AVX512VL", "AVX512BW"],
4560
- "_mm256_mask_permute_pd"=>["AVX512VL", "AVX512F"],
4561
- "_mm256_mask_permutevar_pd"=>["AVX512VL", "AVX512F"],
4562
- "_mm256_maskz_permute_pd"=>["AVX512VL", "AVX512F"],
4563
- "_mm256_maskz_permutevar_pd"=>["AVX512VL", "AVX512F"],
4564
- "_mm_mask_permute_pd"=>["AVX512VL", "AVX512F"],
4565
- "_mm_mask_permutevar_pd"=>["AVX512VL", "AVX512F"],
4566
- "_mm_maskz_permute_pd"=>["AVX512VL", "AVX512F"],
4567
- "_mm_maskz_permutevar_pd"=>["AVX512VL", "AVX512F"],
4568
- "_mm256_mask_permute_ps"=>["AVX512VL", "AVX512F"],
4569
- "_mm256_mask_permutevar_ps"=>["AVX512VL", "AVX512F"],
4570
- "_mm256_maskz_permute_ps"=>["AVX512VL", "AVX512F"],
4571
- "_mm256_maskz_permutevar_ps"=>["AVX512VL", "AVX512F"],
4572
- "_mm_mask_permute_ps"=>["AVX512VL", "AVX512F"],
4573
- "_mm_mask_permutevar_ps"=>["AVX512VL", "AVX512F"],
4574
- "_mm_maskz_permute_ps"=>["AVX512VL", "AVX512F"],
4575
- "_mm_maskz_permutevar_ps"=>["AVX512VL", "AVX512F"],
4576
- "_mm256_mask_permutex_pd"=>["AVX512VL", "AVX512F"],
4577
- "_mm256_mask_permutexvar_pd"=>["AVX512VL", "AVX512F"],
4578
- "_mm256_maskz_permutex_pd"=>["AVX512VL", "AVX512F"],
4579
- "_mm256_maskz_permutexvar_pd"=>["AVX512VL", "AVX512F"],
4580
- "_mm256_permutex_pd"=>["AVX512VL", "AVX512F"],
4581
- "_mm256_permutexvar_pd"=>["AVX512VL", "AVX512F"],
4582
- "_mm256_mask_permutexvar_ps"=>["AVX512VL", "AVX512F"],
4583
- "_mm256_maskz_permutexvar_ps"=>["AVX512VL", "AVX512F"],
4584
- "_mm256_permutexvar_ps"=>["AVX512VL", "AVX512F"],
4585
- "_mm256_mask_permutex_epi64"=>["AVX512VL", "AVX512F"],
4586
- "_mm256_mask_permutexvar_epi64"=>["AVX512VL", "AVX512F"],
4587
- "_mm256_maskz_permutex_epi64"=>["AVX512VL", "AVX512F"],
4588
- "_mm256_maskz_permutexvar_epi64"=>["AVX512VL", "AVX512F"],
4589
- "_mm256_permutex_epi64"=>["AVX512VL", "AVX512F"],
4590
- "_mm256_permutexvar_epi64"=>["AVX512VL", "AVX512F"],
4591
- "_mm256_mask_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4592
- "_mm256_maskz_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4593
- "_mm256_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4556
+ "_mm_mask2_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4557
+ "_mm_mask_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4558
+ "_mm_maskz_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4559
+ "_mm_permutex2var_epi16"=>[["AVX512VL", "AVX512BW"]],
4560
+ "_mm256_mask_permute_pd"=>[["AVX512VL", "AVX512F"]],
4561
+ "_mm256_mask_permutevar_pd"=>[["AVX512VL", "AVX512F"]],
4562
+ "_mm256_maskz_permute_pd"=>[["AVX512VL", "AVX512F"]],
4563
+ "_mm256_maskz_permutevar_pd"=>[["AVX512VL", "AVX512F"]],
4564
+ "_mm_mask_permute_pd"=>[["AVX512VL", "AVX512F"]],
4565
+ "_mm_mask_permutevar_pd"=>[["AVX512VL", "AVX512F"]],
4566
+ "_mm_maskz_permute_pd"=>[["AVX512VL", "AVX512F"]],
4567
+ "_mm_maskz_permutevar_pd"=>[["AVX512VL", "AVX512F"]],
4568
+ "_mm256_mask_permute_ps"=>[["AVX512VL", "AVX512F"]],
4569
+ "_mm256_mask_permutevar_ps"=>[["AVX512VL", "AVX512F"]],
4570
+ "_mm256_maskz_permute_ps"=>[["AVX512VL", "AVX512F"]],
4571
+ "_mm256_maskz_permutevar_ps"=>[["AVX512VL", "AVX512F"]],
4572
+ "_mm_mask_permute_ps"=>[["AVX512VL", "AVX512F"]],
4573
+ "_mm_mask_permutevar_ps"=>[["AVX512VL", "AVX512F"]],
4574
+ "_mm_maskz_permute_ps"=>[["AVX512VL", "AVX512F"]],
4575
+ "_mm_maskz_permutevar_ps"=>[["AVX512VL", "AVX512F"]],
4576
+ "_mm256_mask_permutex_pd"=>[["AVX512VL", "AVX512F"]],
4577
+ "_mm256_mask_permutexvar_pd"=>[["AVX512VL", "AVX512F"]],
4578
+ "_mm256_maskz_permutex_pd"=>[["AVX512VL", "AVX512F"]],
4579
+ "_mm256_maskz_permutexvar_pd"=>[["AVX512VL", "AVX512F"]],
4580
+ "_mm256_permutex_pd"=>[["AVX512VL", "AVX512F"]],
4581
+ "_mm256_permutexvar_pd"=>[["AVX512VL", "AVX512F"]],
4582
+ "_mm256_mask_permutexvar_ps"=>[["AVX512VL", "AVX512F"]],
4583
+ "_mm256_maskz_permutexvar_ps"=>[["AVX512VL", "AVX512F"]],
4584
+ "_mm256_permutexvar_ps"=>[["AVX512VL", "AVX512F"]],
4585
+ "_mm256_mask_permutex_epi64"=>[["AVX512VL", "AVX512F"]],
4586
+ "_mm256_mask_permutexvar_epi64"=>[["AVX512VL", "AVX512F"]],
4587
+ "_mm256_maskz_permutex_epi64"=>[["AVX512VL", "AVX512F"]],
4588
+ "_mm256_maskz_permutexvar_epi64"=>[["AVX512VL", "AVX512F"]],
4589
+ "_mm256_permutex_epi64"=>[["AVX512VL", "AVX512F"]],
4590
+ "_mm256_permutexvar_epi64"=>[["AVX512VL", "AVX512F"]],
4591
+ "_mm256_mask_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4592
+ "_mm256_maskz_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4593
+ "_mm256_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4594
4594
  "_mm512_mask_permutexvar_epi16"=>["AVX512BW"],
4595
4595
  "_mm512_maskz_permutexvar_epi16"=>["AVX512BW"],
4596
4596
  "_mm512_permutexvar_epi16"=>["AVX512BW"],
4597
- "_mm_mask_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4598
- "_mm_maskz_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4599
- "_mm_permutexvar_epi16"=>["AVX512VL", "AVX512BW"],
4600
- "_mm256_mask_expand_epi32"=>["AVX512VL", "AVX512F"],
4601
- "_mm256_mask_expandloadu_epi32"=>["AVX512VL", "AVX512F"],
4602
- "_mm256_maskz_expand_epi32"=>["AVX512VL", "AVX512F"],
4603
- "_mm256_maskz_expandloadu_epi32"=>["AVX512VL", "AVX512F"],
4604
- "_mm_mask_expand_epi32"=>["AVX512VL", "AVX512F"],
4605
- "_mm_mask_expandloadu_epi32"=>["AVX512VL", "AVX512F"],
4606
- "_mm_maskz_expand_epi32"=>["AVX512VL", "AVX512F"],
4607
- "_mm_maskz_expandloadu_epi32"=>["AVX512VL", "AVX512F"],
4608
- "_mm256_mask_expand_epi64"=>["AVX512VL", "AVX512F"],
4609
- "_mm256_mask_expandloadu_epi64"=>["AVX512VL", "AVX512F"],
4610
- "_mm256_maskz_expand_epi64"=>["AVX512VL", "AVX512F"],
4611
- "_mm256_maskz_expandloadu_epi64"=>["AVX512VL", "AVX512F"],
4612
- "_mm_mask_expand_epi64"=>["AVX512VL", "AVX512F"],
4613
- "_mm_mask_expandloadu_epi64"=>["AVX512VL", "AVX512F"],
4614
- "_mm_maskz_expand_epi64"=>["AVX512VL", "AVX512F"],
4615
- "_mm_maskz_expandloadu_epi64"=>["AVX512VL", "AVX512F"],
4616
- "_mm256_mmask_i32gather_epi32"=>["AVX512VL", "AVX512F"],
4617
- "_mm_mmask_i32gather_epi32"=>["AVX512VL", "AVX512F"],
4618
- "_mm256_mmask_i32gather_epi64"=>["AVX512VL", "AVX512F"],
4619
- "_mm_mmask_i32gather_epi64"=>["AVX512VL", "AVX512F"],
4620
- "_mm256_mmask_i64gather_epi32"=>["AVX512VL", "AVX512F"],
4621
- "_mm_mmask_i64gather_epi32"=>["AVX512VL", "AVX512F"],
4622
- "_mm256_mmask_i64gather_epi64"=>["AVX512VL", "AVX512F"],
4623
- "_mm_mmask_i64gather_epi64"=>["AVX512VL", "AVX512F"],
4624
- "_mm256_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4625
- "_mm256_mask_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4626
- "_mm256_maskz_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4627
- "_mm_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4628
- "_mm_mask_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4629
- "_mm_maskz_lzcnt_epi32"=>["AVX512VL", "AVX512CD"],
4630
- "_mm256_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4631
- "_mm256_mask_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4632
- "_mm256_maskz_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4633
- "_mm_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4634
- "_mm_mask_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4635
- "_mm_maskz_lzcnt_epi64"=>["AVX512VL", "AVX512CD"],
4636
- "_mm256_mask_maddubs_epi16"=>["AVX512VL", "AVX512BW"],
4637
- "_mm256_maskz_maddubs_epi16"=>["AVX512VL", "AVX512BW"],
4597
+ "_mm_mask_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4598
+ "_mm_maskz_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4599
+ "_mm_permutexvar_epi16"=>[["AVX512VL", "AVX512BW"]],
4600
+ "_mm256_mask_expand_epi32"=>[["AVX512VL", "AVX512F"]],
4601
+ "_mm256_mask_expandloadu_epi32"=>[["AVX512VL", "AVX512F"]],
4602
+ "_mm256_maskz_expand_epi32"=>[["AVX512VL", "AVX512F"]],
4603
+ "_mm256_maskz_expandloadu_epi32"=>[["AVX512VL", "AVX512F"]],
4604
+ "_mm_mask_expand_epi32"=>[["AVX512VL", "AVX512F"]],
4605
+ "_mm_mask_expandloadu_epi32"=>[["AVX512VL", "AVX512F"]],
4606
+ "_mm_maskz_expand_epi32"=>[["AVX512VL", "AVX512F"]],
4607
+ "_mm_maskz_expandloadu_epi32"=>[["AVX512VL", "AVX512F"]],
4608
+ "_mm256_mask_expand_epi64"=>[["AVX512VL", "AVX512F"]],
4609
+ "_mm256_mask_expandloadu_epi64"=>[["AVX512VL", "AVX512F"]],
4610
+ "_mm256_maskz_expand_epi64"=>[["AVX512VL", "AVX512F"]],
4611
+ "_mm256_maskz_expandloadu_epi64"=>[["AVX512VL", "AVX512F"]],
4612
+ "_mm_mask_expand_epi64"=>[["AVX512VL", "AVX512F"]],
4613
+ "_mm_mask_expandloadu_epi64"=>[["AVX512VL", "AVX512F"]],
4614
+ "_mm_maskz_expand_epi64"=>[["AVX512VL", "AVX512F"]],
4615
+ "_mm_maskz_expandloadu_epi64"=>[["AVX512VL", "AVX512F"]],
4616
+ "_mm256_mmask_i32gather_epi32"=>[["AVX512VL", "AVX512F"]],
4617
+ "_mm_mmask_i32gather_epi32"=>[["AVX512VL", "AVX512F"]],
4618
+ "_mm256_mmask_i32gather_epi64"=>[["AVX512VL", "AVX512F"]],
4619
+ "_mm_mmask_i32gather_epi64"=>[["AVX512VL", "AVX512F"]],
4620
+ "_mm256_mmask_i64gather_epi32"=>[["AVX512VL", "AVX512F"]],
4621
+ "_mm_mmask_i64gather_epi32"=>[["AVX512VL", "AVX512F"]],
4622
+ "_mm256_mmask_i64gather_epi64"=>[["AVX512VL", "AVX512F"]],
4623
+ "_mm_mmask_i64gather_epi64"=>[["AVX512VL", "AVX512F"]],
4624
+ "_mm256_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4625
+ "_mm256_mask_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4626
+ "_mm256_maskz_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4627
+ "_mm_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4628
+ "_mm_mask_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4629
+ "_mm_maskz_lzcnt_epi32"=>[["AVX512VL", "AVX512CD"]],
4630
+ "_mm256_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4631
+ "_mm256_mask_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4632
+ "_mm256_maskz_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4633
+ "_mm_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4634
+ "_mm_mask_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4635
+ "_mm_maskz_lzcnt_epi64"=>[["AVX512VL", "AVX512CD"]],
4636
+ "_mm256_mask_maddubs_epi16"=>[["AVX512VL", "AVX512BW"]],
4637
+ "_mm256_maskz_maddubs_epi16"=>[["AVX512VL", "AVX512BW"]],
4638
4638
  "_mm512_maddubs_epi16"=>["AVX512BW"],
4639
4639
  "_mm512_mask_maddubs_epi16"=>["AVX512BW"],
4640
4640
  "_mm512_maskz_maddubs_epi16"=>["AVX512BW"],
4641
- "_mm_mask_maddubs_epi16"=>["AVX512VL", "AVX512BW"],
4642
- "_mm_maskz_maddubs_epi16"=>["AVX512VL", "AVX512BW"],
4643
- "_mm256_mask_madd_epi16"=>["AVX512VL", "AVX512BW"],
4644
- "_mm256_maskz_madd_epi16"=>["AVX512VL", "AVX512BW"],
4641
+ "_mm_mask_maddubs_epi16"=>[["AVX512VL", "AVX512BW"]],
4642
+ "_mm_maskz_maddubs_epi16"=>[["AVX512VL", "AVX512BW"]],
4643
+ "_mm256_mask_madd_epi16"=>[["AVX512VL", "AVX512BW"]],
4644
+ "_mm256_maskz_madd_epi16"=>[["AVX512VL", "AVX512BW"]],
4645
4645
  "_mm512_madd_epi16"=>["AVX512BW"],
4646
4646
  "_mm512_mask_madd_epi16"=>["AVX512BW"],
4647
4647
  "_mm512_maskz_madd_epi16"=>["AVX512BW"],
4648
- "_mm_mask_madd_epi16"=>["AVX512VL", "AVX512BW"],
4649
- "_mm_maskz_madd_epi16"=>["AVX512VL", "AVX512BW"],
4650
- "_mm256_mask_max_epi8"=>["AVX512VL", "AVX512BW"],
4651
- "_mm256_maskz_max_epi8"=>["AVX512VL", "AVX512BW"],
4648
+ "_mm_mask_madd_epi16"=>[["AVX512VL", "AVX512BW"]],
4649
+ "_mm_maskz_madd_epi16"=>[["AVX512VL", "AVX512BW"]],
4650
+ "_mm256_mask_max_epi8"=>[["AVX512VL", "AVX512BW"]],
4651
+ "_mm256_maskz_max_epi8"=>[["AVX512VL", "AVX512BW"]],
4652
4652
  "_mm512_mask_max_epi8"=>["AVX512BW"],
4653
4653
  "_mm512_maskz_max_epi8"=>["AVX512BW"],
4654
4654
  "_mm512_max_epi8"=>["AVX512BW"],
4655
- "_mm_mask_max_epi8"=>["AVX512VL", "AVX512BW"],
4656
- "_mm_maskz_max_epi8"=>["AVX512VL", "AVX512BW"],
4657
- "_mm256_mask_max_epi32"=>["AVX512VL", "AVX512F"],
4658
- "_mm256_maskz_max_epi32"=>["AVX512VL", "AVX512F"],
4659
- "_mm_mask_max_epi32"=>["AVX512VL", "AVX512F"],
4660
- "_mm_maskz_max_epi32"=>["AVX512VL", "AVX512F"],
4661
- "_mm256_mask_max_epi64"=>["AVX512VL", "AVX512F"],
4662
- "_mm256_maskz_max_epi64"=>["AVX512VL", "AVX512F"],
4663
- "_mm256_max_epi64"=>["AVX512VL", "AVX512F"],
4664
- "_mm_mask_max_epi64"=>["AVX512VL", "AVX512F"],
4665
- "_mm_maskz_max_epi64"=>["AVX512VL", "AVX512F"],
4666
- "_mm_max_epi64"=>["AVX512VL", "AVX512F"],
4667
- "_mm256_mask_max_epi16"=>["AVX512VL", "AVX512BW"],
4668
- "_mm256_maskz_max_epi16"=>["AVX512VL", "AVX512BW"],
4655
+ "_mm_mask_max_epi8"=>[["AVX512VL", "AVX512BW"]],
4656
+ "_mm_maskz_max_epi8"=>[["AVX512VL", "AVX512BW"]],
4657
+ "_mm256_mask_max_epi32"=>[["AVX512VL", "AVX512F"]],
4658
+ "_mm256_maskz_max_epi32"=>[["AVX512VL", "AVX512F"]],
4659
+ "_mm_mask_max_epi32"=>[["AVX512VL", "AVX512F"]],
4660
+ "_mm_maskz_max_epi32"=>[["AVX512VL", "AVX512F"]],
4661
+ "_mm256_mask_max_epi64"=>[["AVX512VL", "AVX512F"]],
4662
+ "_mm256_maskz_max_epi64"=>[["AVX512VL", "AVX512F"]],
4663
+ "_mm256_max_epi64"=>[["AVX512VL", "AVX512F"]],
4664
+ "_mm_mask_max_epi64"=>[["AVX512VL", "AVX512F"]],
4665
+ "_mm_maskz_max_epi64"=>[["AVX512VL", "AVX512F"]],
4666
+ "_mm_max_epi64"=>[["AVX512VL", "AVX512F"]],
4667
+ "_mm256_mask_max_epi16"=>[["AVX512VL", "AVX512BW"]],
4668
+ "_mm256_maskz_max_epi16"=>[["AVX512VL", "AVX512BW"]],
4669
4669
  "_mm512_mask_max_epi16"=>["AVX512BW"],
4670
4670
  "_mm512_maskz_max_epi16"=>["AVX512BW"],
4671
4671
  "_mm512_max_epi16"=>["AVX512BW"],
4672
- "_mm_mask_max_epi16"=>["AVX512VL", "AVX512BW"],
4673
- "_mm_maskz_max_epi16"=>["AVX512VL", "AVX512BW"],
4674
- "_mm256_mask_max_epu8"=>["AVX512VL", "AVX512BW"],
4675
- "_mm256_maskz_max_epu8"=>["AVX512VL", "AVX512BW"],
4672
+ "_mm_mask_max_epi16"=>[["AVX512VL", "AVX512BW"]],
4673
+ "_mm_maskz_max_epi16"=>[["AVX512VL", "AVX512BW"]],
4674
+ "_mm256_mask_max_epu8"=>[["AVX512VL", "AVX512BW"]],
4675
+ "_mm256_maskz_max_epu8"=>[["AVX512VL", "AVX512BW"]],
4676
4676
  "_mm512_mask_max_epu8"=>["AVX512BW"],
4677
4677
  "_mm512_maskz_max_epu8"=>["AVX512BW"],
4678
4678
  "_mm512_max_epu8"=>["AVX512BW"],
4679
- "_mm_mask_max_epu8"=>["AVX512VL", "AVX512BW"],
4680
- "_mm_maskz_max_epu8"=>["AVX512VL", "AVX512BW"],
4681
- "_mm256_mask_max_epu32"=>["AVX512VL", "AVX512F"],
4682
- "_mm256_maskz_max_epu32"=>["AVX512VL", "AVX512F"],
4683
- "_mm_mask_max_epu32"=>["AVX512VL", "AVX512F"],
4684
- "_mm_maskz_max_epu32"=>["AVX512VL", "AVX512F"],
4685
- "_mm256_mask_max_epu64"=>["AVX512VL", "AVX512F"],
4686
- "_mm256_maskz_max_epu64"=>["AVX512VL", "AVX512F"],
4687
- "_mm256_max_epu64"=>["AVX512VL", "AVX512F"],
4688
- "_mm_mask_max_epu64"=>["AVX512VL", "AVX512F"],
4689
- "_mm_maskz_max_epu64"=>["AVX512VL", "AVX512F"],
4690
- "_mm_max_epu64"=>["AVX512VL", "AVX512F"],
4691
- "_mm256_mask_max_epu16"=>["AVX512VL", "AVX512BW"],
4692
- "_mm256_maskz_max_epu16"=>["AVX512VL", "AVX512BW"],
4679
+ "_mm_mask_max_epu8"=>[["AVX512VL", "AVX512BW"]],
4680
+ "_mm_maskz_max_epu8"=>[["AVX512VL", "AVX512BW"]],
4681
+ "_mm256_mask_max_epu32"=>[["AVX512VL", "AVX512F"]],
4682
+ "_mm256_maskz_max_epu32"=>[["AVX512VL", "AVX512F"]],
4683
+ "_mm_mask_max_epu32"=>[["AVX512VL", "AVX512F"]],
4684
+ "_mm_maskz_max_epu32"=>[["AVX512VL", "AVX512F"]],
4685
+ "_mm256_mask_max_epu64"=>[["AVX512VL", "AVX512F"]],
4686
+ "_mm256_maskz_max_epu64"=>[["AVX512VL", "AVX512F"]],
4687
+ "_mm256_max_epu64"=>[["AVX512VL", "AVX512F"]],
4688
+ "_mm_mask_max_epu64"=>[["AVX512VL", "AVX512F"]],
4689
+ "_mm_maskz_max_epu64"=>[["AVX512VL", "AVX512F"]],
4690
+ "_mm_max_epu64"=>[["AVX512VL", "AVX512F"]],
4691
+ "_mm256_mask_max_epu16"=>[["AVX512VL", "AVX512BW"]],
4692
+ "_mm256_maskz_max_epu16"=>[["AVX512VL", "AVX512BW"]],
4693
4693
  "_mm512_mask_max_epu16"=>["AVX512BW"],
4694
4694
  "_mm512_maskz_max_epu16"=>["AVX512BW"],
4695
4695
  "_mm512_max_epu16"=>["AVX512BW"],
4696
- "_mm_mask_max_epu16"=>["AVX512VL", "AVX512BW"],
4697
- "_mm_maskz_max_epu16"=>["AVX512VL", "AVX512BW"],
4698
- "_mm256_mask_min_epi8"=>["AVX512VL", "AVX512BW"],
4699
- "_mm256_maskz_min_epi8"=>["AVX512VL", "AVX512BW"],
4696
+ "_mm_mask_max_epu16"=>[["AVX512VL", "AVX512BW"]],
4697
+ "_mm_maskz_max_epu16"=>[["AVX512VL", "AVX512BW"]],
4698
+ "_mm256_mask_min_epi8"=>[["AVX512VL", "AVX512BW"]],
4699
+ "_mm256_maskz_min_epi8"=>[["AVX512VL", "AVX512BW"]],
4700
4700
  "_mm512_mask_min_epi8"=>["AVX512BW"],
4701
4701
  "_mm512_maskz_min_epi8"=>["AVX512BW"],
4702
4702
  "_mm512_min_epi8"=>["AVX512BW"],
4703
- "_mm_mask_min_epi8"=>["AVX512VL", "AVX512BW"],
4704
- "_mm_maskz_min_epi8"=>["AVX512VL", "AVX512BW"],
4705
- "_mm256_mask_min_epi32"=>["AVX512VL", "AVX512F"],
4706
- "_mm256_maskz_min_epi32"=>["AVX512VL", "AVX512F"],
4707
- "_mm_mask_min_epi32"=>["AVX512VL", "AVX512F"],
4708
- "_mm_maskz_min_epi32"=>["AVX512VL", "AVX512F"],
4709
- "_mm256_mask_min_epi64"=>["AVX512VL", "AVX512F"],
4710
- "_mm256_maskz_min_epi64"=>["AVX512VL", "AVX512F"],
4711
- "_mm256_min_epi64"=>["AVX512VL", "AVX512F"],
4712
- "_mm_mask_min_epi64"=>["AVX512VL", "AVX512F"],
4713
- "_mm_maskz_min_epi64"=>["AVX512VL", "AVX512F"],
4714
- "_mm_min_epi64"=>["AVX512VL", "AVX512F"],
4715
- "_mm256_mask_min_epi16"=>["AVX512VL", "AVX512BW"],
4716
- "_mm256_maskz_min_epi16"=>["AVX512VL", "AVX512BW"],
4703
+ "_mm_mask_min_epi8"=>[["AVX512VL", "AVX512BW"]],
4704
+ "_mm_maskz_min_epi8"=>[["AVX512VL", "AVX512BW"]],
4705
+ "_mm256_mask_min_epi32"=>[["AVX512VL", "AVX512F"]],
4706
+ "_mm256_maskz_min_epi32"=>[["AVX512VL", "AVX512F"]],
4707
+ "_mm_mask_min_epi32"=>[["AVX512VL", "AVX512F"]],
4708
+ "_mm_maskz_min_epi32"=>[["AVX512VL", "AVX512F"]],
4709
+ "_mm256_mask_min_epi64"=>[["AVX512VL", "AVX512F"]],
4710
+ "_mm256_maskz_min_epi64"=>[["AVX512VL", "AVX512F"]],
4711
+ "_mm256_min_epi64"=>[["AVX512VL", "AVX512F"]],
4712
+ "_mm_mask_min_epi64"=>[["AVX512VL", "AVX512F"]],
4713
+ "_mm_maskz_min_epi64"=>[["AVX512VL", "AVX512F"]],
4714
+ "_mm_min_epi64"=>[["AVX512VL", "AVX512F"]],
4715
+ "_mm256_mask_min_epi16"=>[["AVX512VL", "AVX512BW"]],
4716
+ "_mm256_maskz_min_epi16"=>[["AVX512VL", "AVX512BW"]],
4717
4717
  "_mm512_mask_min_epi16"=>["AVX512BW"],
4718
4718
  "_mm512_maskz_min_epi16"=>["AVX512BW"],
4719
4719
  "_mm512_min_epi16"=>["AVX512BW"],
4720
- "_mm_mask_min_epi16"=>["AVX512VL", "AVX512BW"],
4721
- "_mm_maskz_min_epi16"=>["AVX512VL", "AVX512BW"],
4722
- "_mm256_mask_min_epu8"=>["AVX512VL", "AVX512BW"],
4723
- "_mm256_maskz_min_epu8"=>["AVX512VL", "AVX512BW"],
4720
+ "_mm_mask_min_epi16"=>[["AVX512VL", "AVX512BW"]],
4721
+ "_mm_maskz_min_epi16"=>[["AVX512VL", "AVX512BW"]],
4722
+ "_mm256_mask_min_epu8"=>[["AVX512VL", "AVX512BW"]],
4723
+ "_mm256_maskz_min_epu8"=>[["AVX512VL", "AVX512BW"]],
4724
4724
  "_mm512_mask_min_epu8"=>["AVX512BW"],
4725
4725
  "_mm512_maskz_min_epu8"=>["AVX512BW"],
4726
4726
  "_mm512_min_epu8"=>["AVX512BW"],
4727
- "_mm_mask_min_epu8"=>["AVX512VL", "AVX512BW"],
4728
- "_mm_maskz_min_epu8"=>["AVX512VL", "AVX512BW"],
4729
- "_mm256_mask_min_epu32"=>["AVX512VL", "AVX512F"],
4730
- "_mm256_maskz_min_epu32"=>["AVX512VL", "AVX512F"],
4731
- "_mm_mask_min_epu32"=>["AVX512VL", "AVX512F"],
4732
- "_mm_maskz_min_epu32"=>["AVX512VL", "AVX512F"],
4733
- "_mm256_mask_min_epu64"=>["AVX512VL", "AVX512F"],
4734
- "_mm256_maskz_min_epu64"=>["AVX512VL", "AVX512F"],
4735
- "_mm256_min_epu64"=>["AVX512VL", "AVX512F"],
4736
- "_mm_mask_min_epu64"=>["AVX512VL", "AVX512F"],
4737
- "_mm_maskz_min_epu64"=>["AVX512VL", "AVX512F"],
4738
- "_mm_min_epu64"=>["AVX512VL", "AVX512F"],
4739
- "_mm256_mask_min_epu16"=>["AVX512VL", "AVX512BW"],
4740
- "_mm256_maskz_min_epu16"=>["AVX512VL", "AVX512BW"],
4727
+ "_mm_mask_min_epu8"=>[["AVX512VL", "AVX512BW"]],
4728
+ "_mm_maskz_min_epu8"=>[["AVX512VL", "AVX512BW"]],
4729
+ "_mm256_mask_min_epu32"=>[["AVX512VL", "AVX512F"]],
4730
+ "_mm256_maskz_min_epu32"=>[["AVX512VL", "AVX512F"]],
4731
+ "_mm_mask_min_epu32"=>[["AVX512VL", "AVX512F"]],
4732
+ "_mm_maskz_min_epu32"=>[["AVX512VL", "AVX512F"]],
4733
+ "_mm256_mask_min_epu64"=>[["AVX512VL", "AVX512F"]],
4734
+ "_mm256_maskz_min_epu64"=>[["AVX512VL", "AVX512F"]],
4735
+ "_mm256_min_epu64"=>[["AVX512VL", "AVX512F"]],
4736
+ "_mm_mask_min_epu64"=>[["AVX512VL", "AVX512F"]],
4737
+ "_mm_maskz_min_epu64"=>[["AVX512VL", "AVX512F"]],
4738
+ "_mm_min_epu64"=>[["AVX512VL", "AVX512F"]],
4739
+ "_mm256_mask_min_epu16"=>[["AVX512VL", "AVX512BW"]],
4740
+ "_mm256_maskz_min_epu16"=>[["AVX512VL", "AVX512BW"]],
4741
4741
  "_mm512_mask_min_epu16"=>["AVX512BW"],
4742
4742
  "_mm512_maskz_min_epu16"=>["AVX512BW"],
4743
4743
  "_mm512_min_epu16"=>["AVX512BW"],
4744
- "_mm_mask_min_epu16"=>["AVX512VL", "AVX512BW"],
4745
- "_mm_maskz_min_epu16"=>["AVX512VL", "AVX512BW"],
4746
- "_mm256_movepi8_mask"=>["AVX512VL", "AVX512BW"],
4744
+ "_mm_mask_min_epu16"=>[["AVX512VL", "AVX512BW"]],
4745
+ "_mm_maskz_min_epu16"=>[["AVX512VL", "AVX512BW"]],
4746
+ "_mm256_movepi8_mask"=>[["AVX512VL", "AVX512BW"]],
4747
4747
  "_mm512_movepi8_mask"=>["AVX512BW"],
4748
- "_mm_movepi8_mask"=>["AVX512VL", "AVX512BW"],
4749
- "_mm256_movepi32_mask"=>["AVX512VL", "AVX512DQ"],
4748
+ "_mm_movepi8_mask"=>[["AVX512VL", "AVX512BW"]],
4749
+ "_mm256_movepi32_mask"=>[["AVX512VL", "AVX512DQ"]],
4750
4750
  "_mm512_movepi32_mask"=>["AVX512DQ"],
4751
- "_mm_movepi32_mask"=>["AVX512VL", "AVX512DQ"],
4752
- "_mm256_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4753
- "_mm256_mask_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4754
- "_mm256_mask_cvtepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4755
- "_mm256_maskz_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4756
- "_mm_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4757
- "_mm_mask_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4758
- "_mm_mask_cvtepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4759
- "_mm_maskz_cvtepi32_epi8"=>["AVX512VL", "AVX512F"],
4760
- "_mm256_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4761
- "_mm256_mask_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4762
- "_mm256_mask_cvtepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4763
- "_mm256_maskz_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4764
- "_mm_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4765
- "_mm_mask_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4766
- "_mm_mask_cvtepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4767
- "_mm_maskz_cvtepi32_epi16"=>["AVX512VL", "AVX512F"],
4768
- "_mm256_movm_epi8"=>["AVX512VL", "AVX512BW"],
4751
+ "_mm_movepi32_mask"=>[["AVX512VL", "AVX512DQ"]],
4752
+ "_mm256_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4753
+ "_mm256_mask_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4754
+ "_mm256_mask_cvtepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4755
+ "_mm256_maskz_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4756
+ "_mm_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4757
+ "_mm_mask_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4758
+ "_mm_mask_cvtepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4759
+ "_mm_maskz_cvtepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4760
+ "_mm256_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4761
+ "_mm256_mask_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4762
+ "_mm256_mask_cvtepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4763
+ "_mm256_maskz_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4764
+ "_mm_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4765
+ "_mm_mask_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4766
+ "_mm_mask_cvtepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4767
+ "_mm_maskz_cvtepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4768
+ "_mm256_movm_epi8"=>[["AVX512VL", "AVX512BW"]],
4769
4769
  "_mm512_movm_epi8"=>["AVX512BW"],
4770
- "_mm_movm_epi8"=>["AVX512BW", "AVX512VL"],
4771
- "_mm256_movm_epi32"=>["AVX512VL", "AVX512DQ"],
4770
+ "_mm_movm_epi8"=>[["AVX512BW", "AVX512VL"]],
4771
+ "_mm256_movm_epi32"=>[["AVX512VL", "AVX512DQ"]],
4772
4772
  "_mm512_movm_epi32"=>["AVX512DQ"],
4773
- "_mm_movm_epi32"=>["AVX512VL", "AVX512DQ"],
4774
- "_mm256_movm_epi64"=>["AVX512VL", "AVX512DQ"],
4773
+ "_mm_movm_epi32"=>[["AVX512VL", "AVX512DQ"]],
4774
+ "_mm256_movm_epi64"=>[["AVX512VL", "AVX512DQ"]],
4775
4775
  "_mm512_movm_epi64"=>["AVX512DQ"],
4776
- "_mm_movm_epi64"=>["AVX512VL", "AVX512DQ"],
4777
- "_mm256_movm_epi16"=>["AVX512VL", "AVX512BW"],
4776
+ "_mm_movm_epi64"=>[["AVX512VL", "AVX512DQ"]],
4777
+ "_mm256_movm_epi16"=>[["AVX512VL", "AVX512BW"]],
4778
4778
  "_mm512_movm_epi16"=>["AVX512BW"],
4779
- "_mm_movm_epi16"=>["AVX512VL", "AVX512BW"],
4780
- "_mm256_movepi64_mask"=>["AVX512VL", "AVX512DQ"],
4779
+ "_mm_movm_epi16"=>[["AVX512VL", "AVX512BW"]],
4780
+ "_mm256_movepi64_mask"=>[["AVX512VL", "AVX512DQ"]],
4781
4781
  "_mm512_movepi64_mask"=>["AVX512DQ"],
4782
- "_mm_movepi64_mask"=>["AVX512VL", "AVX512DQ"],
4783
- "_mm256_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4784
- "_mm256_mask_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4785
- "_mm256_mask_cvtepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4786
- "_mm256_maskz_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4787
- "_mm_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4788
- "_mm_mask_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4789
- "_mm_mask_cvtepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4790
- "_mm_maskz_cvtepi64_epi8"=>["AVX512VL", "AVX512F"],
4791
- "_mm256_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4792
- "_mm256_mask_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4793
- "_mm256_mask_cvtepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4794
- "_mm256_maskz_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4795
- "_mm_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4796
- "_mm_mask_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4797
- "_mm_mask_cvtepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4798
- "_mm_maskz_cvtepi64_epi32"=>["AVX512VL", "AVX512F"],
4799
- "_mm256_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4800
- "_mm256_mask_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4801
- "_mm256_mask_cvtepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4802
- "_mm256_maskz_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4803
- "_mm_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4804
- "_mm_mask_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4805
- "_mm_mask_cvtepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4806
- "_mm_maskz_cvtepi64_epi16"=>["AVX512VL", "AVX512F"],
4807
- "_mm256_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4808
- "_mm256_mask_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4809
- "_mm256_mask_cvtsepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4810
- "_mm256_maskz_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4811
- "_mm_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4812
- "_mm_mask_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4813
- "_mm_mask_cvtsepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4814
- "_mm_maskz_cvtsepi32_epi8"=>["AVX512VL", "AVX512F"],
4815
- "_mm256_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4816
- "_mm256_mask_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4817
- "_mm256_mask_cvtsepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4818
- "_mm256_maskz_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4819
- "_mm_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4820
- "_mm_mask_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4821
- "_mm_mask_cvtsepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4822
- "_mm_maskz_cvtsepi32_epi16"=>["AVX512VL", "AVX512F"],
4823
- "_mm256_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4824
- "_mm256_mask_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4825
- "_mm256_mask_cvtsepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4826
- "_mm256_maskz_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4827
- "_mm_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4828
- "_mm_mask_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4829
- "_mm_mask_cvtsepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4830
- "_mm_maskz_cvtsepi64_epi8"=>["AVX512VL", "AVX512F"],
4831
- "_mm256_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4832
- "_mm256_mask_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4833
- "_mm256_mask_cvtsepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4834
- "_mm256_maskz_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4835
- "_mm_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4836
- "_mm_mask_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4837
- "_mm_mask_cvtsepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4838
- "_mm_maskz_cvtsepi64_epi32"=>["AVX512VL", "AVX512F"],
4839
- "_mm256_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4840
- "_mm256_mask_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4841
- "_mm256_mask_cvtsepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4842
- "_mm256_maskz_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4843
- "_mm_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4844
- "_mm_mask_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4845
- "_mm_mask_cvtsepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4846
- "_mm_maskz_cvtsepi64_epi16"=>["AVX512VL", "AVX512F"],
4847
- "_mm256_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4848
- "_mm256_mask_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4849
- "_mm256_mask_cvtsepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4850
- "_mm256_maskz_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4782
+ "_mm_movepi64_mask"=>[["AVX512VL", "AVX512DQ"]],
4783
+ "_mm256_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4784
+ "_mm256_mask_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4785
+ "_mm256_mask_cvtepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4786
+ "_mm256_maskz_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4787
+ "_mm_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4788
+ "_mm_mask_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4789
+ "_mm_mask_cvtepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4790
+ "_mm_maskz_cvtepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4791
+ "_mm256_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4792
+ "_mm256_mask_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4793
+ "_mm256_mask_cvtepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4794
+ "_mm256_maskz_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4795
+ "_mm_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4796
+ "_mm_mask_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4797
+ "_mm_mask_cvtepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4798
+ "_mm_maskz_cvtepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4799
+ "_mm256_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4800
+ "_mm256_mask_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4801
+ "_mm256_mask_cvtepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4802
+ "_mm256_maskz_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4803
+ "_mm_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4804
+ "_mm_mask_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4805
+ "_mm_mask_cvtepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4806
+ "_mm_maskz_cvtepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4807
+ "_mm256_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4808
+ "_mm256_mask_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4809
+ "_mm256_mask_cvtsepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4810
+ "_mm256_maskz_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4811
+ "_mm_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4812
+ "_mm_mask_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4813
+ "_mm_mask_cvtsepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4814
+ "_mm_maskz_cvtsepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4815
+ "_mm256_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4816
+ "_mm256_mask_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4817
+ "_mm256_mask_cvtsepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4818
+ "_mm256_maskz_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4819
+ "_mm_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4820
+ "_mm_mask_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4821
+ "_mm_mask_cvtsepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4822
+ "_mm_maskz_cvtsepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4823
+ "_mm256_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4824
+ "_mm256_mask_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4825
+ "_mm256_mask_cvtsepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4826
+ "_mm256_maskz_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4827
+ "_mm_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4828
+ "_mm_mask_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4829
+ "_mm_mask_cvtsepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4830
+ "_mm_maskz_cvtsepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4831
+ "_mm256_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4832
+ "_mm256_mask_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4833
+ "_mm256_mask_cvtsepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4834
+ "_mm256_maskz_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4835
+ "_mm_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4836
+ "_mm_mask_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4837
+ "_mm_mask_cvtsepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4838
+ "_mm_maskz_cvtsepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4839
+ "_mm256_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4840
+ "_mm256_mask_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4841
+ "_mm256_mask_cvtsepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4842
+ "_mm256_maskz_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4843
+ "_mm_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4844
+ "_mm_mask_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4845
+ "_mm_mask_cvtsepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4846
+ "_mm_maskz_cvtsepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4847
+ "_mm256_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4848
+ "_mm256_mask_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4849
+ "_mm256_mask_cvtsepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4850
+ "_mm256_maskz_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4851
4851
  "_mm512_cvtsepi16_epi8"=>["AVX512BW"],
4852
4852
  "_mm512_mask_cvtsepi16_epi8"=>["AVX512BW"],
4853
4853
  "_mm512_mask_cvtsepi16_storeu_epi8"=>["AVX512BW"],
4854
4854
  "_mm512_maskz_cvtsepi16_epi8"=>["AVX512BW"],
4855
- "_mm_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4856
- "_mm_mask_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4857
- "_mm_mask_cvtsepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4858
- "_mm_maskz_cvtsepi16_epi8"=>["AVX512VL", "AVX512BW"],
4859
- "_mm256_mask_cvtepi8_epi32"=>["AVX512VL", "AVX512F"],
4860
- "_mm256_maskz_cvtepi8_epi32"=>["AVX512VL", "AVX512F"],
4861
- "_mm_mask_cvtepi8_epi32"=>["AVX512VL", "AVX512F"],
4862
- "_mm_maskz_cvtepi8_epi32"=>["AVX512VL", "AVX512F"],
4863
- "_mm256_mask_cvtepi8_epi64"=>["AVX512VL", "AVX512F"],
4864
- "_mm256_maskz_cvtepi8_epi64"=>["AVX512VL", "AVX512F"],
4865
- "_mm_mask_cvtepi8_epi64"=>["AVX512VL", "AVX512F"],
4866
- "_mm_maskz_cvtepi8_epi64"=>["AVX512VL", "AVX512F"],
4867
- "_mm256_mask_cvtepi8_epi16"=>["AVX512VL", "AVX512BW"],
4868
- "_mm256_maskz_cvtepi8_epi16"=>["AVX512VL", "AVX512BW"],
4855
+ "_mm_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4856
+ "_mm_mask_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4857
+ "_mm_mask_cvtsepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4858
+ "_mm_maskz_cvtsepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4859
+ "_mm256_mask_cvtepi8_epi32"=>[["AVX512VL", "AVX512F"]],
4860
+ "_mm256_maskz_cvtepi8_epi32"=>[["AVX512VL", "AVX512F"]],
4861
+ "_mm_mask_cvtepi8_epi32"=>[["AVX512VL", "AVX512F"]],
4862
+ "_mm_maskz_cvtepi8_epi32"=>[["AVX512VL", "AVX512F"]],
4863
+ "_mm256_mask_cvtepi8_epi64"=>[["AVX512VL", "AVX512F"]],
4864
+ "_mm256_maskz_cvtepi8_epi64"=>[["AVX512VL", "AVX512F"]],
4865
+ "_mm_mask_cvtepi8_epi64"=>[["AVX512VL", "AVX512F"]],
4866
+ "_mm_maskz_cvtepi8_epi64"=>[["AVX512VL", "AVX512F"]],
4867
+ "_mm256_mask_cvtepi8_epi16"=>[["AVX512VL", "AVX512BW"]],
4868
+ "_mm256_maskz_cvtepi8_epi16"=>[["AVX512VL", "AVX512BW"]],
4869
4869
  "_mm512_cvtepi8_epi16"=>["AVX512BW"],
4870
4870
  "_mm512_mask_cvtepi8_epi16"=>["AVX512BW"],
4871
4871
  "_mm512_maskz_cvtepi8_epi16"=>["AVX512BW"],
4872
- "_mm_mask_cvtepi8_epi16"=>["AVX512VL", "AVX512BW"],
4873
- "_mm_maskz_cvtepi8_epi16"=>["AVX512VL", "AVX512BW"],
4874
- "_mm256_mask_cvtepi32_epi64"=>["AVX512VL", "AVX512F"],
4875
- "_mm256_maskz_cvtepi32_epi64"=>["AVX512VL", "AVX512F"],
4876
- "_mm_mask_cvtepi32_epi64"=>["AVX512VL", "AVX512F"],
4877
- "_mm_maskz_cvtepi32_epi64"=>["AVX512VL", "AVX512F"],
4878
- "_mm256_mask_cvtepi16_epi32"=>["AVX512VL", "AVX512F"],
4879
- "_mm256_maskz_cvtepi16_epi32"=>["AVX512VL", "AVX512F"],
4880
- "_mm_mask_cvtepi16_epi32"=>["AVX512VL", "AVX512F"],
4881
- "_mm_maskz_cvtepi16_epi32"=>["AVX512VL", "AVX512F"],
4882
- "_mm256_mask_cvtepi16_epi64"=>["AVX512VL", "AVX512F"],
4883
- "_mm256_maskz_cvtepi16_epi64"=>["AVX512VL", "AVX512F"],
4884
- "_mm_mask_cvtepi16_epi64"=>["AVX512VL", "AVX512F"],
4885
- "_mm_maskz_cvtepi16_epi64"=>["AVX512VL", "AVX512F"],
4886
- "_mm256_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4887
- "_mm256_mask_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4888
- "_mm256_mask_cvtusepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4889
- "_mm256_maskz_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4890
- "_mm_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4891
- "_mm_mask_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4892
- "_mm_mask_cvtusepi32_storeu_epi8"=>["AVX512VL", "AVX512F"],
4893
- "_mm_maskz_cvtusepi32_epi8"=>["AVX512VL", "AVX512F"],
4894
- "_mm256_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4895
- "_mm256_mask_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4896
- "_mm256_mask_cvtusepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4897
- "_mm256_maskz_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4898
- "_mm_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4899
- "_mm_mask_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4900
- "_mm_mask_cvtusepi32_storeu_epi16"=>["AVX512VL", "AVX512F"],
4901
- "_mm_maskz_cvtusepi32_epi16"=>["AVX512VL", "AVX512F"],
4902
- "_mm256_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4903
- "_mm256_mask_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4904
- "_mm256_mask_cvtusepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4905
- "_mm256_maskz_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4906
- "_mm_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4907
- "_mm_mask_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4908
- "_mm_mask_cvtusepi64_storeu_epi8"=>["AVX512VL", "AVX512F"],
4909
- "_mm_maskz_cvtusepi64_epi8"=>["AVX512VL", "AVX512F"],
4910
- "_mm256_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4911
- "_mm256_mask_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4912
- "_mm256_mask_cvtusepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4913
- "_mm256_maskz_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4914
- "_mm_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4915
- "_mm_mask_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4916
- "_mm_mask_cvtusepi64_storeu_epi32"=>["AVX512VL", "AVX512F"],
4917
- "_mm_maskz_cvtusepi64_epi32"=>["AVX512VL", "AVX512F"],
4918
- "_mm256_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4919
- "_mm256_mask_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4920
- "_mm256_mask_cvtusepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4921
- "_mm256_maskz_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4922
- "_mm_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4923
- "_mm_mask_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4924
- "_mm_mask_cvtusepi64_storeu_epi16"=>["AVX512VL", "AVX512F"],
4925
- "_mm_maskz_cvtusepi64_epi16"=>["AVX512VL", "AVX512F"],
4926
- "_mm256_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4927
- "_mm256_mask_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4928
- "_mm256_mask_cvtusepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4929
- "_mm256_maskz_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4872
+ "_mm_mask_cvtepi8_epi16"=>[["AVX512VL", "AVX512BW"]],
4873
+ "_mm_maskz_cvtepi8_epi16"=>[["AVX512VL", "AVX512BW"]],
4874
+ "_mm256_mask_cvtepi32_epi64"=>[["AVX512VL", "AVX512F"]],
4875
+ "_mm256_maskz_cvtepi32_epi64"=>[["AVX512VL", "AVX512F"]],
4876
+ "_mm_mask_cvtepi32_epi64"=>[["AVX512VL", "AVX512F"]],
4877
+ "_mm_maskz_cvtepi32_epi64"=>[["AVX512VL", "AVX512F"]],
4878
+ "_mm256_mask_cvtepi16_epi32"=>[["AVX512VL", "AVX512F"]],
4879
+ "_mm256_maskz_cvtepi16_epi32"=>[["AVX512VL", "AVX512F"]],
4880
+ "_mm_mask_cvtepi16_epi32"=>[["AVX512VL", "AVX512F"]],
4881
+ "_mm_maskz_cvtepi16_epi32"=>[["AVX512VL", "AVX512F"]],
4882
+ "_mm256_mask_cvtepi16_epi64"=>[["AVX512VL", "AVX512F"]],
4883
+ "_mm256_maskz_cvtepi16_epi64"=>[["AVX512VL", "AVX512F"]],
4884
+ "_mm_mask_cvtepi16_epi64"=>[["AVX512VL", "AVX512F"]],
4885
+ "_mm_maskz_cvtepi16_epi64"=>[["AVX512VL", "AVX512F"]],
4886
+ "_mm256_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4887
+ "_mm256_mask_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4888
+ "_mm256_mask_cvtusepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4889
+ "_mm256_maskz_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4890
+ "_mm_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4891
+ "_mm_mask_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4892
+ "_mm_mask_cvtusepi32_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4893
+ "_mm_maskz_cvtusepi32_epi8"=>[["AVX512VL", "AVX512F"]],
4894
+ "_mm256_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4895
+ "_mm256_mask_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4896
+ "_mm256_mask_cvtusepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4897
+ "_mm256_maskz_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4898
+ "_mm_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4899
+ "_mm_mask_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4900
+ "_mm_mask_cvtusepi32_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4901
+ "_mm_maskz_cvtusepi32_epi16"=>[["AVX512VL", "AVX512F"]],
4902
+ "_mm256_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4903
+ "_mm256_mask_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4904
+ "_mm256_mask_cvtusepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4905
+ "_mm256_maskz_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4906
+ "_mm_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4907
+ "_mm_mask_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4908
+ "_mm_mask_cvtusepi64_storeu_epi8"=>[["AVX512VL", "AVX512F"]],
4909
+ "_mm_maskz_cvtusepi64_epi8"=>[["AVX512VL", "AVX512F"]],
4910
+ "_mm256_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4911
+ "_mm256_mask_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4912
+ "_mm256_mask_cvtusepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4913
+ "_mm256_maskz_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4914
+ "_mm_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4915
+ "_mm_mask_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4916
+ "_mm_mask_cvtusepi64_storeu_epi32"=>[["AVX512VL", "AVX512F"]],
4917
+ "_mm_maskz_cvtusepi64_epi32"=>[["AVX512VL", "AVX512F"]],
4918
+ "_mm256_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4919
+ "_mm256_mask_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4920
+ "_mm256_mask_cvtusepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4921
+ "_mm256_maskz_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4922
+ "_mm_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4923
+ "_mm_mask_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4924
+ "_mm_mask_cvtusepi64_storeu_epi16"=>[["AVX512VL", "AVX512F"]],
4925
+ "_mm_maskz_cvtusepi64_epi16"=>[["AVX512VL", "AVX512F"]],
4926
+ "_mm256_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4927
+ "_mm256_mask_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4928
+ "_mm256_mask_cvtusepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4929
+ "_mm256_maskz_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4930
4930
  "_mm512_cvtusepi16_epi8"=>["AVX512BW"],
4931
4931
  "_mm512_mask_cvtusepi16_epi8"=>["AVX512BW"],
4932
4932
  "_mm512_mask_cvtusepi16_storeu_epi8"=>["AVX512BW"],
4933
4933
  "_mm512_maskz_cvtusepi16_epi8"=>["AVX512BW"],
4934
- "_mm_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4935
- "_mm_mask_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4936
- "_mm_mask_cvtusepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4937
- "_mm_maskz_cvtusepi16_epi8"=>["AVX512VL", "AVX512BW"],
4938
- "_mm256_movepi16_mask"=>["AVX512VL", "AVX512BW"],
4934
+ "_mm_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4935
+ "_mm_mask_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4936
+ "_mm_mask_cvtusepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4937
+ "_mm_maskz_cvtusepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4938
+ "_mm256_movepi16_mask"=>[["AVX512VL", "AVX512BW"]],
4939
4939
  "_mm512_movepi16_mask"=>["AVX512BW"],
4940
- "_mm_movepi16_mask"=>["AVX512VL", "AVX512BW"],
4941
- "_mm256_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4942
- "_mm256_mask_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4943
- "_mm256_mask_cvtepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4944
- "_mm256_maskz_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4940
+ "_mm_movepi16_mask"=>[["AVX512VL", "AVX512BW"]],
4941
+ "_mm256_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4942
+ "_mm256_mask_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4943
+ "_mm256_mask_cvtepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4944
+ "_mm256_maskz_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4945
4945
  "_mm512_cvtepi16_epi8"=>["AVX512BW"],
4946
4946
  "_mm512_mask_cvtepi16_epi8"=>["AVX512BW"],
4947
4947
  "_mm512_mask_cvtepi16_storeu_epi8"=>["AVX512BW"],
4948
4948
  "_mm512_maskz_cvtepi16_epi8"=>["AVX512BW"],
4949
- "_mm_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4950
- "_mm_mask_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4951
- "_mm_mask_cvtepi16_storeu_epi8"=>["AVX512VL", "AVX512BW"],
4952
- "_mm_maskz_cvtepi16_epi8"=>["AVX512VL", "AVX512BW"],
4953
- "_mm256_mask_cvtepu8_epi32"=>["AVX512VL", "AVX512F"],
4954
- "_mm256_maskz_cvtepu8_epi32"=>["AVX512VL", "AVX512F"],
4955
- "_mm_mask_cvtepu8_epi32"=>["AVX512VL", "AVX512F"],
4956
- "_mm_maskz_cvtepu8_epi32"=>["AVX512VL", "AVX512F"],
4957
- "_mm256_mask_cvtepu8_epi64"=>["AVX512VL", "AVX512F"],
4958
- "_mm256_maskz_cvtepu8_epi64"=>["AVX512VL", "AVX512F"],
4959
- "_mm_mask_cvtepu8_epi64"=>["AVX512VL", "AVX512F"],
4960
- "_mm_maskz_cvtepu8_epi64"=>["AVX512VL", "AVX512F"],
4961
- "_mm256_mask_cvtepu8_epi16"=>["AVX512VL", "AVX512BW"],
4962
- "_mm256_maskz_cvtepu8_epi16"=>["AVX512VL", "AVX512BW"],
4949
+ "_mm_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4950
+ "_mm_mask_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4951
+ "_mm_mask_cvtepi16_storeu_epi8"=>[["AVX512VL", "AVX512BW"]],
4952
+ "_mm_maskz_cvtepi16_epi8"=>[["AVX512VL", "AVX512BW"]],
4953
+ "_mm256_mask_cvtepu8_epi32"=>[["AVX512VL", "AVX512F"]],
4954
+ "_mm256_maskz_cvtepu8_epi32"=>[["AVX512VL", "AVX512F"]],
4955
+ "_mm_mask_cvtepu8_epi32"=>[["AVX512VL", "AVX512F"]],
4956
+ "_mm_maskz_cvtepu8_epi32"=>[["AVX512VL", "AVX512F"]],
4957
+ "_mm256_mask_cvtepu8_epi64"=>[["AVX512VL", "AVX512F"]],
4958
+ "_mm256_maskz_cvtepu8_epi64"=>[["AVX512VL", "AVX512F"]],
4959
+ "_mm_mask_cvtepu8_epi64"=>[["AVX512VL", "AVX512F"]],
4960
+ "_mm_maskz_cvtepu8_epi64"=>[["AVX512VL", "AVX512F"]],
4961
+ "_mm256_mask_cvtepu8_epi16"=>[["AVX512VL", "AVX512BW"]],
4962
+ "_mm256_maskz_cvtepu8_epi16"=>[["AVX512VL", "AVX512BW"]],
4963
4963
  "_mm512_cvtepu8_epi16"=>["AVX512BW"],
4964
4964
  "_mm512_mask_cvtepu8_epi16"=>["AVX512BW"],
4965
4965
  "_mm512_maskz_cvtepu8_epi16"=>["AVX512BW"],
4966
- "_mm_mask_cvtepu8_epi16"=>["AVX512VL", "AVX512BW"],
4967
- "_mm_maskz_cvtepu8_epi16"=>["AVX512VL", "AVX512BW"],
4968
- "_mm256_mask_cvtepu32_epi64"=>["AVX512VL", "AVX512F"],
4969
- "_mm256_maskz_cvtepu32_epi64"=>["AVX512VL", "AVX512F"],
4970
- "_mm_mask_cvtepu32_epi64"=>["AVX512VL", "AVX512F"],
4971
- "_mm_maskz_cvtepu32_epi64"=>["AVX512VL", "AVX512F"],
4972
- "_mm256_mask_cvtepu16_epi32"=>["AVX512VL", "AVX512F"],
4973
- "_mm256_maskz_cvtepu16_epi32"=>["AVX512VL", "AVX512F"],
4974
- "_mm_mask_cvtepu16_epi32"=>["AVX512VL", "AVX512F"],
4975
- "_mm_maskz_cvtepu16_epi32"=>["AVX512VL", "AVX512F"],
4976
- "_mm256_mask_cvtepu16_epi64"=>["AVX512VL", "AVX512F"],
4977
- "_mm256_maskz_cvtepu16_epi64"=>["AVX512VL", "AVX512F"],
4978
- "_mm_mask_cvtepu16_epi64"=>["AVX512VL", "AVX512F"],
4979
- "_mm_maskz_cvtepu16_epi64"=>["AVX512VL", "AVX512F"],
4980
- "_mm256_mask_mul_epi32"=>["AVX512VL", "AVX512F"],
4981
- "_mm256_maskz_mul_epi32"=>["AVX512VL", "AVX512F"],
4982
- "_mm_mask_mul_epi32"=>["AVX512VL", "AVX512F"],
4983
- "_mm_maskz_mul_epi32"=>["AVX512VL", "AVX512F"],
4984
- "_mm256_mask_mulhrs_epi16"=>["AVX512VL", "AVX512BW"],
4985
- "_mm256_maskz_mulhrs_epi16"=>["AVX512VL", "AVX512BW"],
4966
+ "_mm_mask_cvtepu8_epi16"=>[["AVX512VL", "AVX512BW"]],
4967
+ "_mm_maskz_cvtepu8_epi16"=>[["AVX512VL", "AVX512BW"]],
4968
+ "_mm256_mask_cvtepu32_epi64"=>[["AVX512VL", "AVX512F"]],
4969
+ "_mm256_maskz_cvtepu32_epi64"=>[["AVX512VL", "AVX512F"]],
4970
+ "_mm_mask_cvtepu32_epi64"=>[["AVX512VL", "AVX512F"]],
4971
+ "_mm_maskz_cvtepu32_epi64"=>[["AVX512VL", "AVX512F"]],
4972
+ "_mm256_mask_cvtepu16_epi32"=>[["AVX512VL", "AVX512F"]],
4973
+ "_mm256_maskz_cvtepu16_epi32"=>[["AVX512VL", "AVX512F"]],
4974
+ "_mm_mask_cvtepu16_epi32"=>[["AVX512VL", "AVX512F"]],
4975
+ "_mm_maskz_cvtepu16_epi32"=>[["AVX512VL", "AVX512F"]],
4976
+ "_mm256_mask_cvtepu16_epi64"=>[["AVX512VL", "AVX512F"]],
4977
+ "_mm256_maskz_cvtepu16_epi64"=>[["AVX512VL", "AVX512F"]],
4978
+ "_mm_mask_cvtepu16_epi64"=>[["AVX512VL", "AVX512F"]],
4979
+ "_mm_maskz_cvtepu16_epi64"=>[["AVX512VL", "AVX512F"]],
4980
+ "_mm256_mask_mul_epi32"=>[["AVX512VL", "AVX512F"]],
4981
+ "_mm256_maskz_mul_epi32"=>[["AVX512VL", "AVX512F"]],
4982
+ "_mm_mask_mul_epi32"=>[["AVX512VL", "AVX512F"]],
4983
+ "_mm_maskz_mul_epi32"=>[["AVX512VL", "AVX512F"]],
4984
+ "_mm256_mask_mulhrs_epi16"=>[["AVX512VL", "AVX512BW"]],
4985
+ "_mm256_maskz_mulhrs_epi16"=>[["AVX512VL", "AVX512BW"]],
4986
4986
  "_mm512_mask_mulhrs_epi16"=>["AVX512BW"],
4987
4987
  "_mm512_maskz_mulhrs_epi16"=>["AVX512BW"],
4988
4988
  "_mm512_mulhrs_epi16"=>["AVX512BW"],
4989
- "_mm_mask_mulhrs_epi16"=>["AVX512VL", "AVX512BW"],
4990
- "_mm_maskz_mulhrs_epi16"=>["AVX512VL", "AVX512BW"],
4991
- "_mm256_mask_mulhi_epu16"=>["AVX512VL", "AVX512BW"],
4992
- "_mm256_maskz_mulhi_epu16"=>["AVX512VL", "AVX512BW"],
4989
+ "_mm_mask_mulhrs_epi16"=>[["AVX512VL", "AVX512BW"]],
4990
+ "_mm_maskz_mulhrs_epi16"=>[["AVX512VL", "AVX512BW"]],
4991
+ "_mm256_mask_mulhi_epu16"=>[["AVX512VL", "AVX512BW"]],
4992
+ "_mm256_maskz_mulhi_epu16"=>[["AVX512VL", "AVX512BW"]],
4993
4993
  "_mm512_mask_mulhi_epu16"=>["AVX512BW"],
4994
4994
  "_mm512_maskz_mulhi_epu16"=>["AVX512BW"],
4995
4995
  "_mm512_mulhi_epu16"=>["AVX512BW"],
4996
- "_mm_mask_mulhi_epu16"=>["AVX512VL", "AVX512BW"],
4997
- "_mm_maskz_mulhi_epu16"=>["AVX512VL", "AVX512BW"],
4998
- "_mm256_mask_mulhi_epi16"=>["AVX512VL", "AVX512BW"],
4999
- "_mm256_maskz_mulhi_epi16"=>["AVX512VL", "AVX512BW"],
4996
+ "_mm_mask_mulhi_epu16"=>[["AVX512VL", "AVX512BW"]],
4997
+ "_mm_maskz_mulhi_epu16"=>[["AVX512VL", "AVX512BW"]],
4998
+ "_mm256_mask_mulhi_epi16"=>[["AVX512VL", "AVX512BW"]],
4999
+ "_mm256_maskz_mulhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5000
5000
  "_mm512_mask_mulhi_epi16"=>["AVX512BW"],
5001
5001
  "_mm512_maskz_mulhi_epi16"=>["AVX512BW"],
5002
5002
  "_mm512_mulhi_epi16"=>["AVX512BW"],
5003
- "_mm_mask_mulhi_epi16"=>["AVX512VL", "AVX512BW"],
5004
- "_mm_maskz_mulhi_epi16"=>["AVX512VL", "AVX512BW"],
5005
- "_mm256_mask_mullo_epi32"=>["AVX512VL", "AVX512F"],
5006
- "_mm256_maskz_mullo_epi32"=>["AVX512VL", "AVX512F"],
5003
+ "_mm_mask_mulhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5004
+ "_mm_maskz_mulhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5005
+ "_mm256_mask_mullo_epi32"=>[["AVX512VL", "AVX512F"]],
5006
+ "_mm256_maskz_mullo_epi32"=>[["AVX512VL", "AVX512F"]],
5007
5007
  "_mm512_maskz_mullo_epi32"=>["AVX512F"],
5008
- "_mm_mask_mullo_epi32"=>["AVX512VL", "AVX512F"],
5009
- "_mm_maskz_mullo_epi32"=>["AVX512VL", "AVX512F"],
5010
- "_mm256_mask_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5011
- "_mm256_maskz_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5012
- "_mm256_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5008
+ "_mm_mask_mullo_epi32"=>[["AVX512VL", "AVX512F"]],
5009
+ "_mm_maskz_mullo_epi32"=>[["AVX512VL", "AVX512F"]],
5010
+ "_mm256_mask_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5011
+ "_mm256_maskz_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5012
+ "_mm256_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5013
5013
  "_mm512_mask_mullo_epi64"=>["AVX512DQ"],
5014
5014
  "_mm512_maskz_mullo_epi64"=>["AVX512DQ"],
5015
5015
  "_mm512_mullo_epi64"=>["AVX512DQ"],
5016
- "_mm_mask_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5017
- "_mm_maskz_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5018
- "_mm_mullo_epi64"=>["AVX512VL", "AVX512DQ"],
5019
- "_mm256_mask_mullo_epi16"=>["AVX512VL", "AVX512BW"],
5020
- "_mm256_maskz_mullo_epi16"=>["AVX512VL", "AVX512BW"],
5016
+ "_mm_mask_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5017
+ "_mm_maskz_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5018
+ "_mm_mullo_epi64"=>[["AVX512VL", "AVX512DQ"]],
5019
+ "_mm256_mask_mullo_epi16"=>[["AVX512VL", "AVX512BW"]],
5020
+ "_mm256_maskz_mullo_epi16"=>[["AVX512VL", "AVX512BW"]],
5021
5021
  "_mm512_mask_mullo_epi16"=>["AVX512BW"],
5022
5022
  "_mm512_maskz_mullo_epi16"=>["AVX512BW"],
5023
5023
  "_mm512_mullo_epi16"=>["AVX512BW"],
5024
- "_mm_mask_mullo_epi16"=>["AVX512VL", "AVX512BW"],
5025
- "_mm_maskz_mullo_epi16"=>["AVX512VL", "AVX512BW"],
5026
- "_mm256_mask_mul_epu32"=>["AVX512VL", "AVX512F"],
5027
- "_mm256_maskz_mul_epu32"=>["AVX512VL", "AVX512F"],
5028
- "_mm_mask_mul_epu32"=>["AVX512VL", "AVX512F"],
5029
- "_mm_maskz_mul_epu32"=>["AVX512VL", "AVX512F"],
5030
- "_mm256_mask_or_epi32"=>["AVX512VL", "AVX512F"],
5031
- "_mm256_maskz_or_epi32"=>["AVX512VL", "AVX512F"],
5032
- "_mm_mask_or_epi32"=>["AVX512VL", "AVX512F"],
5033
- "_mm_maskz_or_epi32"=>["AVX512VL", "AVX512F"],
5034
- "_mm256_mask_or_epi64"=>["AVX512VL", "AVX512F"],
5035
- "_mm256_maskz_or_epi64"=>["AVX512VL", "AVX512F"],
5036
- "_mm_mask_or_epi64"=>["AVX512VL", "AVX512F"],
5037
- "_mm_maskz_or_epi64"=>["AVX512VL", "AVX512F"],
5038
- "_mm256_mask_rol_epi32"=>["AVX512VL", "AVX512F"],
5039
- "_mm256_maskz_rol_epi32"=>["AVX512VL", "AVX512F"],
5040
- "_mm256_rol_epi32"=>["AVX512VL", "AVX512F"],
5041
- "_mm_mask_rol_epi32"=>["AVX512VL", "AVX512F"],
5042
- "_mm_maskz_rol_epi32"=>["AVX512VL", "AVX512F"],
5043
- "_mm_rol_epi32"=>["AVX512VL", "AVX512F"],
5044
- "_mm256_mask_rol_epi64"=>["AVX512VL", "AVX512F"],
5045
- "_mm256_maskz_rol_epi64"=>["AVX512VL", "AVX512F"],
5046
- "_mm256_rol_epi64"=>["AVX512VL", "AVX512F"],
5047
- "_mm_mask_rol_epi64"=>["AVX512VL", "AVX512F"],
5048
- "_mm_maskz_rol_epi64"=>["AVX512VL", "AVX512F"],
5049
- "_mm_rol_epi64"=>["AVX512VL", "AVX512F"],
5050
- "_mm256_mask_rolv_epi32"=>["AVX512VL", "AVX512F"],
5051
- "_mm256_maskz_rolv_epi32"=>["AVX512VL", "AVX512F"],
5052
- "_mm256_rolv_epi32"=>["AVX512VL", "AVX512F"],
5053
- "_mm_mask_rolv_epi32"=>["AVX512VL", "AVX512F"],
5054
- "_mm_maskz_rolv_epi32"=>["AVX512VL", "AVX512F"],
5055
- "_mm_rolv_epi32"=>["AVX512VL", "AVX512F"],
5056
- "_mm256_mask_rolv_epi64"=>["AVX512VL", "AVX512F"],
5057
- "_mm256_maskz_rolv_epi64"=>["AVX512VL", "AVX512F"],
5058
- "_mm256_rolv_epi64"=>["AVX512VL", "AVX512F"],
5059
- "_mm_mask_rolv_epi64"=>["AVX512VL", "AVX512F"],
5060
- "_mm_maskz_rolv_epi64"=>["AVX512VL", "AVX512F"],
5061
- "_mm_rolv_epi64"=>["AVX512VL", "AVX512F"],
5062
- "_mm256_mask_ror_epi32"=>["AVX512VL", "AVX512F"],
5063
- "_mm256_maskz_ror_epi32"=>["AVX512VL", "AVX512F"],
5064
- "_mm256_ror_epi32"=>["AVX512VL", "AVX512F"],
5065
- "_mm_mask_ror_epi32"=>["AVX512VL", "AVX512F"],
5066
- "_mm_maskz_ror_epi32"=>["AVX512VL", "AVX512F"],
5067
- "_mm_ror_epi32"=>["AVX512VL", "AVX512F"],
5068
- "_mm256_mask_ror_epi64"=>["AVX512VL", "AVX512F"],
5069
- "_mm256_maskz_ror_epi64"=>["AVX512VL", "AVX512F"],
5070
- "_mm256_ror_epi64"=>["AVX512VL", "AVX512F"],
5071
- "_mm_mask_ror_epi64"=>["AVX512VL", "AVX512F"],
5072
- "_mm_maskz_ror_epi64"=>["AVX512VL", "AVX512F"],
5073
- "_mm_ror_epi64"=>["AVX512VL", "AVX512F"],
5074
- "_mm256_mask_rorv_epi32"=>["AVX512VL", "AVX512F"],
5075
- "_mm256_maskz_rorv_epi32"=>["AVX512VL", "AVX512F"],
5076
- "_mm256_rorv_epi32"=>["AVX512VL", "AVX512F"],
5077
- "_mm_mask_rorv_epi32"=>["AVX512VL", "AVX512F"],
5078
- "_mm_maskz_rorv_epi32"=>["AVX512VL", "AVX512F"],
5079
- "_mm_rorv_epi32"=>["AVX512VL", "AVX512F"],
5080
- "_mm256_mask_rorv_epi64"=>["AVX512VL", "AVX512F"],
5081
- "_mm256_maskz_rorv_epi64"=>["AVX512VL", "AVX512F"],
5082
- "_mm256_rorv_epi64"=>["AVX512VL", "AVX512F"],
5083
- "_mm_mask_rorv_epi64"=>["AVX512VL", "AVX512F"],
5084
- "_mm_maskz_rorv_epi64"=>["AVX512VL", "AVX512F"],
5085
- "_mm_rorv_epi64"=>["AVX512VL", "AVX512F"],
5024
+ "_mm_mask_mullo_epi16"=>[["AVX512VL", "AVX512BW"]],
5025
+ "_mm_maskz_mullo_epi16"=>[["AVX512VL", "AVX512BW"]],
5026
+ "_mm256_mask_mul_epu32"=>[["AVX512VL", "AVX512F"]],
5027
+ "_mm256_maskz_mul_epu32"=>[["AVX512VL", "AVX512F"]],
5028
+ "_mm_mask_mul_epu32"=>[["AVX512VL", "AVX512F"]],
5029
+ "_mm_maskz_mul_epu32"=>[["AVX512VL", "AVX512F"]],
5030
+ "_mm256_mask_or_epi32"=>[["AVX512VL", "AVX512F"]],
5031
+ "_mm256_maskz_or_epi32"=>[["AVX512VL", "AVX512F"]],
5032
+ "_mm_mask_or_epi32"=>[["AVX512VL", "AVX512F"]],
5033
+ "_mm_maskz_or_epi32"=>[["AVX512VL", "AVX512F"]],
5034
+ "_mm256_mask_or_epi64"=>[["AVX512VL", "AVX512F"]],
5035
+ "_mm256_maskz_or_epi64"=>[["AVX512VL", "AVX512F"]],
5036
+ "_mm_mask_or_epi64"=>[["AVX512VL", "AVX512F"]],
5037
+ "_mm_maskz_or_epi64"=>[["AVX512VL", "AVX512F"]],
5038
+ "_mm256_mask_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5039
+ "_mm256_maskz_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5040
+ "_mm256_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5041
+ "_mm_mask_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5042
+ "_mm_maskz_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5043
+ "_mm_rol_epi32"=>[["AVX512VL", "AVX512F"]],
5044
+ "_mm256_mask_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5045
+ "_mm256_maskz_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5046
+ "_mm256_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5047
+ "_mm_mask_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5048
+ "_mm_maskz_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5049
+ "_mm_rol_epi64"=>[["AVX512VL", "AVX512F"]],
5050
+ "_mm256_mask_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5051
+ "_mm256_maskz_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5052
+ "_mm256_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5053
+ "_mm_mask_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5054
+ "_mm_maskz_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5055
+ "_mm_rolv_epi32"=>[["AVX512VL", "AVX512F"]],
5056
+ "_mm256_mask_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5057
+ "_mm256_maskz_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5058
+ "_mm256_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5059
+ "_mm_mask_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5060
+ "_mm_maskz_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5061
+ "_mm_rolv_epi64"=>[["AVX512VL", "AVX512F"]],
5062
+ "_mm256_mask_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5063
+ "_mm256_maskz_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5064
+ "_mm256_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5065
+ "_mm_mask_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5066
+ "_mm_maskz_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5067
+ "_mm_ror_epi32"=>[["AVX512VL", "AVX512F"]],
5068
+ "_mm256_mask_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5069
+ "_mm256_maskz_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5070
+ "_mm256_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5071
+ "_mm_mask_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5072
+ "_mm_maskz_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5073
+ "_mm_ror_epi64"=>[["AVX512VL", "AVX512F"]],
5074
+ "_mm256_mask_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5075
+ "_mm256_maskz_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5076
+ "_mm256_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5077
+ "_mm_mask_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5078
+ "_mm_maskz_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5079
+ "_mm_rorv_epi32"=>[["AVX512VL", "AVX512F"]],
5080
+ "_mm256_mask_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5081
+ "_mm256_maskz_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5082
+ "_mm256_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5083
+ "_mm_mask_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5084
+ "_mm_maskz_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5085
+ "_mm_rorv_epi64"=>[["AVX512VL", "AVX512F"]],
5086
5086
  "_mm512_sad_epu8"=>["AVX512BW"],
5087
- "_mm256_i32scatter_epi32"=>["AVX512VL", "AVX512F"],
5088
- "_mm256_mask_i32scatter_epi32"=>["AVX512VL", "AVX512F"],
5089
- "_mm_i32scatter_epi32"=>["AVX512VL", "AVX512F"],
5090
- "_mm_mask_i32scatter_epi32"=>["AVX512VL", "AVX512F"],
5091
- "_mm256_i32scatter_epi64"=>["AVX512VL", "AVX512F"],
5092
- "_mm256_mask_i32scatter_epi64"=>["AVX512VL", "AVX512F"],
5093
- "_mm_i32scatter_epi64"=>["AVX512VL", "AVX512F"],
5094
- "_mm_mask_i32scatter_epi64"=>["AVX512VL", "AVX512F"],
5095
- "_mm256_i64scatter_epi32"=>["AVX512VL", "AVX512F"],
5096
- "_mm256_mask_i64scatter_epi32"=>["AVX512VL", "AVX512F"],
5097
- "_mm_i64scatter_epi32"=>["AVX512VL", "AVX512F"],
5098
- "_mm_mask_i64scatter_epi32"=>["AVX512VL", "AVX512F"],
5099
- "_mm256_i64scatter_epi64"=>["AVX512VL", "AVX512F"],
5100
- "_mm256_mask_i64scatter_epi64"=>["AVX512VL", "AVX512F"],
5101
- "_mm_i64scatter_epi64"=>["AVX512VL", "AVX512F"],
5102
- "_mm_mask_i64scatter_epi64"=>["AVX512VL", "AVX512F"],
5103
- "_mm256_mask_shuffle_epi8"=>["AVX512VL", "AVX512BW"],
5104
- "_mm256_maskz_shuffle_epi8"=>["AVX512VL", "AVX512BW"],
5087
+ "_mm256_i32scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5088
+ "_mm256_mask_i32scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5089
+ "_mm_i32scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5090
+ "_mm_mask_i32scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5091
+ "_mm256_i32scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5092
+ "_mm256_mask_i32scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5093
+ "_mm_i32scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5094
+ "_mm_mask_i32scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5095
+ "_mm256_i64scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5096
+ "_mm256_mask_i64scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5097
+ "_mm_i64scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5098
+ "_mm_mask_i64scatter_epi32"=>[["AVX512VL", "AVX512F"]],
5099
+ "_mm256_i64scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5100
+ "_mm256_mask_i64scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5101
+ "_mm_i64scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5102
+ "_mm_mask_i64scatter_epi64"=>[["AVX512VL", "AVX512F"]],
5103
+ "_mm256_mask_shuffle_epi8"=>[["AVX512VL", "AVX512BW"]],
5104
+ "_mm256_maskz_shuffle_epi8"=>[["AVX512VL", "AVX512BW"]],
5105
5105
  "_mm512_mask_shuffle_epi8"=>["AVX512BW"],
5106
5106
  "_mm512_maskz_shuffle_epi8"=>["AVX512BW"],
5107
5107
  "_mm512_shuffle_epi8"=>["AVX512BW"],
5108
- "_mm_mask_shuffle_epi8"=>["AVX512VL", "AVX512BW"],
5109
- "_mm_maskz_shuffle_epi8"=>["AVX512VL", "AVX512BW"],
5110
- "_mm256_mask_shuffle_epi32"=>["AVX512VL", "AVX512F"],
5111
- "_mm256_maskz_shuffle_epi32"=>["AVX512VL", "AVX512F"],
5112
- "_mm_mask_shuffle_epi32"=>["AVX512VL", "AVX512F"],
5113
- "_mm_maskz_shuffle_epi32"=>["AVX512VL", "AVX512F"],
5114
- "_mm256_mask_shufflehi_epi16"=>["AVX512VL", "AVX512BW"],
5115
- "_mm256_maskz_shufflehi_epi16"=>["AVX512VL", "AVX512BW"],
5108
+ "_mm_mask_shuffle_epi8"=>[["AVX512VL", "AVX512BW"]],
5109
+ "_mm_maskz_shuffle_epi8"=>[["AVX512VL", "AVX512BW"]],
5110
+ "_mm256_mask_shuffle_epi32"=>[["AVX512VL", "AVX512F"]],
5111
+ "_mm256_maskz_shuffle_epi32"=>[["AVX512VL", "AVX512F"]],
5112
+ "_mm_mask_shuffle_epi32"=>[["AVX512VL", "AVX512F"]],
5113
+ "_mm_maskz_shuffle_epi32"=>[["AVX512VL", "AVX512F"]],
5114
+ "_mm256_mask_shufflehi_epi16"=>[["AVX512VL", "AVX512BW"]],
5115
+ "_mm256_maskz_shufflehi_epi16"=>[["AVX512VL", "AVX512BW"]],
5116
5116
  "_mm512_mask_shufflehi_epi16"=>["AVX512BW"],
5117
5117
  "_mm512_maskz_shufflehi_epi16"=>["AVX512BW"],
5118
5118
  "_mm512_shufflehi_epi16"=>["AVX512BW"],
5119
- "_mm_mask_shufflehi_epi16"=>["AVX512VL", "AVX512BW"],
5120
- "_mm_maskz_shufflehi_epi16"=>["AVX512VL", "AVX512BW"],
5121
- "_mm256_mask_shufflelo_epi16"=>["AVX512VL", "AVX512BW"],
5122
- "_mm256_maskz_shufflelo_epi16"=>["AVX512VL", "AVX512BW"],
5119
+ "_mm_mask_shufflehi_epi16"=>[["AVX512VL", "AVX512BW"]],
5120
+ "_mm_maskz_shufflehi_epi16"=>[["AVX512VL", "AVX512BW"]],
5121
+ "_mm256_mask_shufflelo_epi16"=>[["AVX512VL", "AVX512BW"]],
5122
+ "_mm256_maskz_shufflelo_epi16"=>[["AVX512VL", "AVX512BW"]],
5123
5123
  "_mm512_mask_shufflelo_epi16"=>["AVX512BW"],
5124
5124
  "_mm512_maskz_shufflelo_epi16"=>["AVX512BW"],
5125
5125
  "_mm512_shufflelo_epi16"=>["AVX512BW"],
5126
- "_mm_mask_shufflelo_epi16"=>["AVX512VL", "AVX512BW"],
5127
- "_mm_maskz_shufflelo_epi16"=>["AVX512VL", "AVX512BW"],
5128
- "_mm256_mask_sll_epi32"=>["AVX512VL", "AVX512F"],
5129
- "_mm256_mask_slli_epi32"=>["AVX512VL", "AVX512F"],
5130
- "_mm256_maskz_sll_epi32"=>["AVX512VL", "AVX512F"],
5131
- "_mm256_maskz_slli_epi32"=>["AVX512VL", "AVX512F"],
5132
- "_mm_mask_sll_epi32"=>["AVX512VL", "AVX512F"],
5133
- "_mm_mask_slli_epi32"=>["AVX512VL", "AVX512F"],
5134
- "_mm_maskz_sll_epi32"=>["AVX512VL", "AVX512F"],
5135
- "_mm_maskz_slli_epi32"=>["AVX512VL", "AVX512F"],
5126
+ "_mm_mask_shufflelo_epi16"=>[["AVX512VL", "AVX512BW"]],
5127
+ "_mm_maskz_shufflelo_epi16"=>[["AVX512VL", "AVX512BW"]],
5128
+ "_mm256_mask_sll_epi32"=>[["AVX512VL", "AVX512F"]],
5129
+ "_mm256_mask_slli_epi32"=>[["AVX512VL", "AVX512F"]],
5130
+ "_mm256_maskz_sll_epi32"=>[["AVX512VL", "AVX512F"]],
5131
+ "_mm256_maskz_slli_epi32"=>[["AVX512VL", "AVX512F"]],
5132
+ "_mm_mask_sll_epi32"=>[["AVX512VL", "AVX512F"]],
5133
+ "_mm_mask_slli_epi32"=>[["AVX512VL", "AVX512F"]],
5134
+ "_mm_maskz_sll_epi32"=>[["AVX512VL", "AVX512F"]],
5135
+ "_mm_maskz_slli_epi32"=>[["AVX512VL", "AVX512F"]],
5136
5136
  "_mm512_bslli_epi128"=>["AVX512BW"],
5137
- "_mm256_mask_sll_epi64"=>["AVX512VL", "AVX512F"],
5138
- "_mm256_mask_slli_epi64"=>["AVX512VL", "AVX512F"],
5139
- "_mm256_maskz_sll_epi64"=>["AVX512VL", "AVX512F"],
5140
- "_mm256_maskz_slli_epi64"=>["AVX512VL", "AVX512F"],
5141
- "_mm_mask_sll_epi64"=>["AVX512VL", "AVX512F"],
5142
- "_mm_mask_slli_epi64"=>["AVX512VL", "AVX512F"],
5143
- "_mm_maskz_sll_epi64"=>["AVX512VL", "AVX512F"],
5144
- "_mm_maskz_slli_epi64"=>["AVX512VL", "AVX512F"],
5145
- "_mm256_mask_sllv_epi32"=>["AVX512VL", "AVX512F"],
5146
- "_mm256_maskz_sllv_epi32"=>["AVX512VL", "AVX512F"],
5147
- "_mm_mask_sllv_epi32"=>["AVX512VL", "AVX512F"],
5148
- "_mm_maskz_sllv_epi32"=>["AVX512VL", "AVX512F"],
5149
- "_mm256_mask_sllv_epi64"=>["AVX512VL", "AVX512F"],
5150
- "_mm256_maskz_sllv_epi64"=>["AVX512VL", "AVX512F"],
5151
- "_mm_mask_sllv_epi64"=>["AVX512VL", "AVX512F"],
5152
- "_mm_maskz_sllv_epi64"=>["AVX512VL", "AVX512F"],
5153
- "_mm256_mask_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5154
- "_mm256_maskz_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5155
- "_mm256_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5137
+ "_mm256_mask_sll_epi64"=>[["AVX512VL", "AVX512F"]],
5138
+ "_mm256_mask_slli_epi64"=>[["AVX512VL", "AVX512F"]],
5139
+ "_mm256_maskz_sll_epi64"=>[["AVX512VL", "AVX512F"]],
5140
+ "_mm256_maskz_slli_epi64"=>[["AVX512VL", "AVX512F"]],
5141
+ "_mm_mask_sll_epi64"=>[["AVX512VL", "AVX512F"]],
5142
+ "_mm_mask_slli_epi64"=>[["AVX512VL", "AVX512F"]],
5143
+ "_mm_maskz_sll_epi64"=>[["AVX512VL", "AVX512F"]],
5144
+ "_mm_maskz_slli_epi64"=>[["AVX512VL", "AVX512F"]],
5145
+ "_mm256_mask_sllv_epi32"=>[["AVX512VL", "AVX512F"]],
5146
+ "_mm256_maskz_sllv_epi32"=>[["AVX512VL", "AVX512F"]],
5147
+ "_mm_mask_sllv_epi32"=>[["AVX512VL", "AVX512F"]],
5148
+ "_mm_maskz_sllv_epi32"=>[["AVX512VL", "AVX512F"]],
5149
+ "_mm256_mask_sllv_epi64"=>[["AVX512VL", "AVX512F"]],
5150
+ "_mm256_maskz_sllv_epi64"=>[["AVX512VL", "AVX512F"]],
5151
+ "_mm_mask_sllv_epi64"=>[["AVX512VL", "AVX512F"]],
5152
+ "_mm_maskz_sllv_epi64"=>[["AVX512VL", "AVX512F"]],
5153
+ "_mm256_mask_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5154
+ "_mm256_maskz_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5155
+ "_mm256_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5156
5156
  "_mm512_mask_sllv_epi16"=>["AVX512BW"],
5157
5157
  "_mm512_maskz_sllv_epi16"=>["AVX512BW"],
5158
5158
  "_mm512_sllv_epi16"=>["AVX512BW"],
5159
- "_mm_mask_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5160
- "_mm_maskz_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5161
- "_mm_sllv_epi16"=>["AVX512VL", "AVX512BW"],
5162
- "_mm256_mask_sll_epi16"=>["AVX512VL", "AVX512BW"],
5163
- "_mm256_mask_slli_epi16"=>["AVX512VL", "AVX512BW"],
5164
- "_mm256_maskz_sll_epi16"=>["AVX512VL", "AVX512BW"],
5165
- "_mm256_maskz_slli_epi16"=>["AVX512VL", "AVX512BW"],
5159
+ "_mm_mask_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5160
+ "_mm_maskz_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5161
+ "_mm_sllv_epi16"=>[["AVX512VL", "AVX512BW"]],
5162
+ "_mm256_mask_sll_epi16"=>[["AVX512VL", "AVX512BW"]],
5163
+ "_mm256_mask_slli_epi16"=>[["AVX512VL", "AVX512BW"]],
5164
+ "_mm256_maskz_sll_epi16"=>[["AVX512VL", "AVX512BW"]],
5165
+ "_mm256_maskz_slli_epi16"=>[["AVX512VL", "AVX512BW"]],
5166
5166
  "_mm512_mask_sll_epi16"=>["AVX512BW"],
5167
5167
  "_mm512_mask_slli_epi16"=>["AVX512BW"],
5168
5168
  "_mm512_maskz_sll_epi16"=>["AVX512BW"],
5169
5169
  "_mm512_maskz_slli_epi16"=>["AVX512BW"],
5170
5170
  "_mm512_sll_epi16"=>["AVX512BW"],
5171
5171
  "_mm512_slli_epi16"=>["AVX512BW"],
5172
- "_mm_mask_sll_epi16"=>["AVX512VL", "AVX512BW"],
5173
- "_mm_mask_slli_epi16"=>["AVX512VL", "AVX512BW"],
5174
- "_mm_maskz_sll_epi16"=>["AVX512VL", "AVX512BW"],
5175
- "_mm_maskz_slli_epi16"=>["AVX512VL", "AVX512BW"],
5176
- "_mm256_mask_sra_epi32"=>["AVX512VL", "AVX512F"],
5177
- "_mm256_mask_srai_epi32"=>["AVX512VL", "AVX512F"],
5178
- "_mm256_maskz_sra_epi32"=>["AVX512VL", "AVX512F"],
5179
- "_mm256_maskz_srai_epi32"=>["AVX512VL", "AVX512F"],
5180
- "_mm_mask_sra_epi32"=>["AVX512VL", "AVX512F"],
5181
- "_mm_mask_srai_epi32"=>["AVX512VL", "AVX512F"],
5182
- "_mm_maskz_sra_epi32"=>["AVX512VL", "AVX512F"],
5183
- "_mm_maskz_srai_epi32"=>["AVX512VL", "AVX512F"],
5184
- "_mm256_mask_sra_epi64"=>["AVX512VL", "AVX512F"],
5185
- "_mm256_mask_srai_epi64"=>["AVX512VL", "AVX512F"],
5186
- "_mm256_maskz_sra_epi64"=>["AVX512VL", "AVX512F"],
5187
- "_mm256_maskz_srai_epi64"=>["AVX512VL", "AVX512F"],
5188
- "_mm256_sra_epi64"=>["AVX512VL", "AVX512F"],
5189
- "_mm256_srai_epi64"=>["AVX512VL", "AVX512F"],
5190
- "_mm_mask_sra_epi64"=>["AVX512VL", "AVX512F"],
5191
- "_mm_mask_srai_epi64"=>["AVX512VL", "AVX512F"],
5192
- "_mm_maskz_sra_epi64"=>["AVX512VL", "AVX512F"],
5193
- "_mm_maskz_srai_epi64"=>["AVX512VL", "AVX512F"],
5194
- "_mm_sra_epi64"=>["AVX512VL", "AVX512F"],
5195
- "_mm_srai_epi64"=>["AVX512VL", "AVX512F"],
5196
- "_mm256_mask_srav_epi32"=>["AVX512VL", "AVX512F"],
5197
- "_mm256_maskz_srav_epi32"=>["AVX512VL", "AVX512F"],
5198
- "_mm_mask_srav_epi32"=>["AVX512VL", "AVX512F"],
5199
- "_mm_maskz_srav_epi32"=>["AVX512VL", "AVX512F"],
5200
- "_mm256_mask_srav_epi64"=>["AVX512VL", "AVX512F"],
5201
- "_mm256_maskz_srav_epi64"=>["AVX512VL", "AVX512F"],
5202
- "_mm256_srav_epi64"=>["AVX512VL", "AVX512F"],
5203
- "_mm_mask_srav_epi64"=>["AVX512VL", "AVX512F"],
5204
- "_mm_maskz_srav_epi64"=>["AVX512VL", "AVX512F"],
5205
- "_mm_srav_epi64"=>["AVX512VL", "AVX512F"],
5206
- "_mm256_mask_srav_epi16"=>["AVX512VL", "AVX512BW"],
5207
- "_mm256_maskz_srav_epi16"=>["AVX512VL", "AVX512BW"],
5208
- "_mm256_srav_epi16"=>["AVX512VL", "AVX512BW"],
5172
+ "_mm_mask_sll_epi16"=>[["AVX512VL", "AVX512BW"]],
5173
+ "_mm_mask_slli_epi16"=>[["AVX512VL", "AVX512BW"]],
5174
+ "_mm_maskz_sll_epi16"=>[["AVX512VL", "AVX512BW"]],
5175
+ "_mm_maskz_slli_epi16"=>[["AVX512VL", "AVX512BW"]],
5176
+ "_mm256_mask_sra_epi32"=>[["AVX512VL", "AVX512F"]],
5177
+ "_mm256_mask_srai_epi32"=>[["AVX512VL", "AVX512F"]],
5178
+ "_mm256_maskz_sra_epi32"=>[["AVX512VL", "AVX512F"]],
5179
+ "_mm256_maskz_srai_epi32"=>[["AVX512VL", "AVX512F"]],
5180
+ "_mm_mask_sra_epi32"=>[["AVX512VL", "AVX512F"]],
5181
+ "_mm_mask_srai_epi32"=>[["AVX512VL", "AVX512F"]],
5182
+ "_mm_maskz_sra_epi32"=>[["AVX512VL", "AVX512F"]],
5183
+ "_mm_maskz_srai_epi32"=>[["AVX512VL", "AVX512F"]],
5184
+ "_mm256_mask_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5185
+ "_mm256_mask_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5186
+ "_mm256_maskz_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5187
+ "_mm256_maskz_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5188
+ "_mm256_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5189
+ "_mm256_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5190
+ "_mm_mask_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5191
+ "_mm_mask_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5192
+ "_mm_maskz_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5193
+ "_mm_maskz_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5194
+ "_mm_sra_epi64"=>[["AVX512VL", "AVX512F"]],
5195
+ "_mm_srai_epi64"=>[["AVX512VL", "AVX512F"]],
5196
+ "_mm256_mask_srav_epi32"=>[["AVX512VL", "AVX512F"]],
5197
+ "_mm256_maskz_srav_epi32"=>[["AVX512VL", "AVX512F"]],
5198
+ "_mm_mask_srav_epi32"=>[["AVX512VL", "AVX512F"]],
5199
+ "_mm_maskz_srav_epi32"=>[["AVX512VL", "AVX512F"]],
5200
+ "_mm256_mask_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5201
+ "_mm256_maskz_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5202
+ "_mm256_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5203
+ "_mm_mask_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5204
+ "_mm_maskz_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5205
+ "_mm_srav_epi64"=>[["AVX512VL", "AVX512F"]],
5206
+ "_mm256_mask_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5207
+ "_mm256_maskz_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5208
+ "_mm256_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5209
5209
  "_mm512_mask_srav_epi16"=>["AVX512BW"],
5210
5210
  "_mm512_maskz_srav_epi16"=>["AVX512BW"],
5211
5211
  "_mm512_srav_epi16"=>["AVX512BW"],
5212
- "_mm_mask_srav_epi16"=>["AVX512VL", "AVX512BW"],
5213
- "_mm_maskz_srav_epi16"=>["AVX512VL", "AVX512BW"],
5214
- "_mm_srav_epi16"=>["AVX512VL", "AVX512BW"],
5215
- "_mm256_mask_sra_epi16"=>["AVX512VL", "AVX512BW"],
5216
- "_mm256_mask_srai_epi16"=>["AVX512VL", "AVX512BW"],
5217
- "_mm256_maskz_sra_epi16"=>["AVX512VL", "AVX512BW"],
5218
- "_mm256_maskz_srai_epi16"=>["AVX512VL", "AVX512BW"],
5212
+ "_mm_mask_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5213
+ "_mm_maskz_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5214
+ "_mm_srav_epi16"=>[["AVX512VL", "AVX512BW"]],
5215
+ "_mm256_mask_sra_epi16"=>[["AVX512VL", "AVX512BW"]],
5216
+ "_mm256_mask_srai_epi16"=>[["AVX512VL", "AVX512BW"]],
5217
+ "_mm256_maskz_sra_epi16"=>[["AVX512VL", "AVX512BW"]],
5218
+ "_mm256_maskz_srai_epi16"=>[["AVX512VL", "AVX512BW"]],
5219
5219
  "_mm512_mask_sra_epi16"=>["AVX512BW"],
5220
5220
  "_mm512_mask_srai_epi16"=>["AVX512BW"],
5221
5221
  "_mm512_maskz_sra_epi16"=>["AVX512BW"],
5222
5222
  "_mm512_maskz_srai_epi16"=>["AVX512BW"],
5223
5223
  "_mm512_sra_epi16"=>["AVX512BW"],
5224
5224
  "_mm512_srai_epi16"=>["AVX512BW"],
5225
- "_mm_mask_sra_epi16"=>["AVX512VL", "AVX512BW"],
5226
- "_mm_mask_srai_epi16"=>["AVX512VL", "AVX512BW"],
5227
- "_mm_maskz_sra_epi16"=>["AVX512VL", "AVX512BW"],
5228
- "_mm_maskz_srai_epi16"=>["AVX512VL", "AVX512BW"],
5229
- "_mm256_mask_srl_epi32"=>["AVX512VL", "AVX512F"],
5230
- "_mm256_mask_srli_epi32"=>["AVX512VL", "AVX512F"],
5231
- "_mm256_maskz_srl_epi32"=>["AVX512VL", "AVX512F"],
5232
- "_mm256_maskz_srli_epi32"=>["AVX512VL", "AVX512F"],
5233
- "_mm_mask_srl_epi32"=>["AVX512VL", "AVX512F"],
5234
- "_mm_mask_srli_epi32"=>["AVX512VL", "AVX512F"],
5235
- "_mm_maskz_srl_epi32"=>["AVX512VL", "AVX512F"],
5236
- "_mm_maskz_srli_epi32"=>["AVX512VL", "AVX512F"],
5225
+ "_mm_mask_sra_epi16"=>[["AVX512VL", "AVX512BW"]],
5226
+ "_mm_mask_srai_epi16"=>[["AVX512VL", "AVX512BW"]],
5227
+ "_mm_maskz_sra_epi16"=>[["AVX512VL", "AVX512BW"]],
5228
+ "_mm_maskz_srai_epi16"=>[["AVX512VL", "AVX512BW"]],
5229
+ "_mm256_mask_srl_epi32"=>[["AVX512VL", "AVX512F"]],
5230
+ "_mm256_mask_srli_epi32"=>[["AVX512VL", "AVX512F"]],
5231
+ "_mm256_maskz_srl_epi32"=>[["AVX512VL", "AVX512F"]],
5232
+ "_mm256_maskz_srli_epi32"=>[["AVX512VL", "AVX512F"]],
5233
+ "_mm_mask_srl_epi32"=>[["AVX512VL", "AVX512F"]],
5234
+ "_mm_mask_srli_epi32"=>[["AVX512VL", "AVX512F"]],
5235
+ "_mm_maskz_srl_epi32"=>[["AVX512VL", "AVX512F"]],
5236
+ "_mm_maskz_srli_epi32"=>[["AVX512VL", "AVX512F"]],
5237
5237
  "_mm512_bsrli_epi128"=>["AVX512BW"],
5238
- "_mm256_mask_srl_epi64"=>["AVX512VL", "AVX512F"],
5239
- "_mm256_mask_srli_epi64"=>["AVX512VL", "AVX512F"],
5240
- "_mm256_maskz_srl_epi64"=>["AVX512VL", "AVX512F"],
5241
- "_mm256_maskz_srli_epi64"=>["AVX512VL", "AVX512F"],
5242
- "_mm_mask_srl_epi64"=>["AVX512VL", "AVX512F"],
5243
- "_mm_mask_srli_epi64"=>["AVX512VL", "AVX512F"],
5244
- "_mm_maskz_srl_epi64"=>["AVX512VL", "AVX512F"],
5245
- "_mm_maskz_srli_epi64"=>["AVX512VL", "AVX512F"],
5246
- "_mm256_mask_srlv_epi32"=>["AVX512VL", "AVX512F"],
5247
- "_mm256_maskz_srlv_epi32"=>["AVX512VL", "AVX512F"],
5248
- "_mm_mask_srlv_epi32"=>["AVX512VL", "AVX512F"],
5249
- "_mm_maskz_srlv_epi32"=>["AVX512VL", "AVX512F"],
5250
- "_mm256_mask_srlv_epi64"=>["AVX512VL", "AVX512F"],
5251
- "_mm256_maskz_srlv_epi64"=>["AVX512VL", "AVX512F"],
5252
- "_mm_mask_srlv_epi64"=>["AVX512VL", "AVX512F"],
5253
- "_mm_maskz_srlv_epi64"=>["AVX512VL", "AVX512F"],
5254
- "_mm256_mask_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5255
- "_mm256_maskz_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5256
- "_mm256_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5238
+ "_mm256_mask_srl_epi64"=>[["AVX512VL", "AVX512F"]],
5239
+ "_mm256_mask_srli_epi64"=>[["AVX512VL", "AVX512F"]],
5240
+ "_mm256_maskz_srl_epi64"=>[["AVX512VL", "AVX512F"]],
5241
+ "_mm256_maskz_srli_epi64"=>[["AVX512VL", "AVX512F"]],
5242
+ "_mm_mask_srl_epi64"=>[["AVX512VL", "AVX512F"]],
5243
+ "_mm_mask_srli_epi64"=>[["AVX512VL", "AVX512F"]],
5244
+ "_mm_maskz_srl_epi64"=>[["AVX512VL", "AVX512F"]],
5245
+ "_mm_maskz_srli_epi64"=>[["AVX512VL", "AVX512F"]],
5246
+ "_mm256_mask_srlv_epi32"=>[["AVX512VL", "AVX512F"]],
5247
+ "_mm256_maskz_srlv_epi32"=>[["AVX512VL", "AVX512F"]],
5248
+ "_mm_mask_srlv_epi32"=>[["AVX512VL", "AVX512F"]],
5249
+ "_mm_maskz_srlv_epi32"=>[["AVX512VL", "AVX512F"]],
5250
+ "_mm256_mask_srlv_epi64"=>[["AVX512VL", "AVX512F"]],
5251
+ "_mm256_maskz_srlv_epi64"=>[["AVX512VL", "AVX512F"]],
5252
+ "_mm_mask_srlv_epi64"=>[["AVX512VL", "AVX512F"]],
5253
+ "_mm_maskz_srlv_epi64"=>[["AVX512VL", "AVX512F"]],
5254
+ "_mm256_mask_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5255
+ "_mm256_maskz_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5256
+ "_mm256_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5257
5257
  "_mm512_mask_srlv_epi16"=>["AVX512BW"],
5258
5258
  "_mm512_maskz_srlv_epi16"=>["AVX512BW"],
5259
5259
  "_mm512_srlv_epi16"=>["AVX512BW"],
5260
- "_mm_mask_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5261
- "_mm_maskz_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5262
- "_mm_srlv_epi16"=>["AVX512VL", "AVX512BW"],
5263
- "_mm256_mask_srl_epi16"=>["AVX512VL", "AVX512BW"],
5264
- "_mm256_mask_srli_epi16"=>["AVX512VL", "AVX512BW"],
5265
- "_mm256_maskz_srl_epi16"=>["AVX512VL", "AVX512BW"],
5266
- "_mm256_maskz_srli_epi16"=>["AVX512VL", "AVX512BW"],
5260
+ "_mm_mask_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5261
+ "_mm_maskz_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5262
+ "_mm_srlv_epi16"=>[["AVX512VL", "AVX512BW"]],
5263
+ "_mm256_mask_srl_epi16"=>[["AVX512VL", "AVX512BW"]],
5264
+ "_mm256_mask_srli_epi16"=>[["AVX512VL", "AVX512BW"]],
5265
+ "_mm256_maskz_srl_epi16"=>[["AVX512VL", "AVX512BW"]],
5266
+ "_mm256_maskz_srli_epi16"=>[["AVX512VL", "AVX512BW"]],
5267
5267
  "_mm512_mask_srl_epi16"=>["AVX512BW"],
5268
5268
  "_mm512_mask_srli_epi16"=>["AVX512BW"],
5269
5269
  "_mm512_maskz_srl_epi16"=>["AVX512BW"],
5270
5270
  "_mm512_maskz_srli_epi16"=>["AVX512BW"],
5271
5271
  "_mm512_srl_epi16"=>["AVX512BW"],
5272
5272
  "_mm512_srli_epi16"=>["AVX512BW"],
5273
- "_mm_mask_srl_epi16"=>["AVX512VL", "AVX512BW"],
5274
- "_mm_mask_srli_epi16"=>["AVX512VL", "AVX512BW"],
5275
- "_mm_maskz_srl_epi16"=>["AVX512VL", "AVX512BW"],
5276
- "_mm_maskz_srli_epi16"=>["AVX512VL", "AVX512BW"],
5277
- "_mm256_mask_sub_epi8"=>["AVX512VL", "AVX512BW"],
5278
- "_mm256_maskz_sub_epi8"=>["AVX512VL", "AVX512BW"],
5273
+ "_mm_mask_srl_epi16"=>[["AVX512VL", "AVX512BW"]],
5274
+ "_mm_mask_srli_epi16"=>[["AVX512VL", "AVX512BW"]],
5275
+ "_mm_maskz_srl_epi16"=>[["AVX512VL", "AVX512BW"]],
5276
+ "_mm_maskz_srli_epi16"=>[["AVX512VL", "AVX512BW"]],
5277
+ "_mm256_mask_sub_epi8"=>[["AVX512VL", "AVX512BW"]],
5278
+ "_mm256_maskz_sub_epi8"=>[["AVX512VL", "AVX512BW"]],
5279
5279
  "_mm512_mask_sub_epi8"=>["AVX512BW"],
5280
5280
  "_mm512_maskz_sub_epi8"=>["AVX512BW"],
5281
5281
  "_mm512_sub_epi8"=>["AVX512BW"],
5282
- "_mm_mask_sub_epi8"=>["AVX512VL", "AVX512BW"],
5283
- "_mm_maskz_sub_epi8"=>["AVX512VL", "AVX512BW"],
5284
- "_mm256_mask_sub_epi32"=>["AVX512VL", "AVX512F"],
5285
- "_mm256_maskz_sub_epi32"=>["AVX512VL", "AVX512F"],
5286
- "_mm_mask_sub_epi32"=>["AVX512VL", "AVX512F"],
5287
- "_mm_maskz_sub_epi32"=>["AVX512VL", "AVX512F"],
5288
- "_mm256_mask_sub_epi64"=>["AVX512VL", "AVX512F"],
5289
- "_mm256_maskz_sub_epi64"=>["AVX512VL", "AVX512F"],
5290
- "_mm_mask_sub_epi64"=>["AVX512VL", "AVX512F"],
5291
- "_mm_maskz_sub_epi64"=>["AVX512VL", "AVX512F"],
5292
- "_mm256_mask_subs_epi8"=>["AVX512VL", "AVX512BW"],
5293
- "_mm256_maskz_subs_epi8"=>["AVX512VL", "AVX512BW"],
5282
+ "_mm_mask_sub_epi8"=>[["AVX512VL", "AVX512BW"]],
5283
+ "_mm_maskz_sub_epi8"=>[["AVX512VL", "AVX512BW"]],
5284
+ "_mm256_mask_sub_epi32"=>[["AVX512VL", "AVX512F"]],
5285
+ "_mm256_maskz_sub_epi32"=>[["AVX512VL", "AVX512F"]],
5286
+ "_mm_mask_sub_epi32"=>[["AVX512VL", "AVX512F"]],
5287
+ "_mm_maskz_sub_epi32"=>[["AVX512VL", "AVX512F"]],
5288
+ "_mm256_mask_sub_epi64"=>[["AVX512VL", "AVX512F"]],
5289
+ "_mm256_maskz_sub_epi64"=>[["AVX512VL", "AVX512F"]],
5290
+ "_mm_mask_sub_epi64"=>[["AVX512VL", "AVX512F"]],
5291
+ "_mm_maskz_sub_epi64"=>[["AVX512VL", "AVX512F"]],
5292
+ "_mm256_mask_subs_epi8"=>[["AVX512VL", "AVX512BW"]],
5293
+ "_mm256_maskz_subs_epi8"=>[["AVX512VL", "AVX512BW"]],
5294
5294
  "_mm512_mask_subs_epi8"=>["AVX512BW"],
5295
5295
  "_mm512_maskz_subs_epi8"=>["AVX512BW"],
5296
5296
  "_mm512_subs_epi8"=>["AVX512BW"],
5297
- "_mm_mask_subs_epi8"=>["AVX512VL", "AVX512BW"],
5298
- "_mm_maskz_subs_epi8"=>["AVX512VL", "AVX512BW"],
5299
- "_mm256_mask_subs_epi16"=>["AVX512VL", "AVX512BW"],
5300
- "_mm256_maskz_subs_epi16"=>["AVX512VL", "AVX512BW"],
5297
+ "_mm_mask_subs_epi8"=>[["AVX512VL", "AVX512BW"]],
5298
+ "_mm_maskz_subs_epi8"=>[["AVX512VL", "AVX512BW"]],
5299
+ "_mm256_mask_subs_epi16"=>[["AVX512VL", "AVX512BW"]],
5300
+ "_mm256_maskz_subs_epi16"=>[["AVX512VL", "AVX512BW"]],
5301
5301
  "_mm512_mask_subs_epi16"=>["AVX512BW"],
5302
5302
  "_mm512_maskz_subs_epi16"=>["AVX512BW"],
5303
5303
  "_mm512_subs_epi16"=>["AVX512BW"],
5304
- "_mm_mask_subs_epi16"=>["AVX512VL", "AVX512BW"],
5305
- "_mm_maskz_subs_epi16"=>["AVX512VL", "AVX512BW"],
5306
- "_mm256_mask_subs_epu8"=>["AVX512VL", "AVX512BW"],
5307
- "_mm256_maskz_subs_epu8"=>["AVX512VL", "AVX512BW"],
5304
+ "_mm_mask_subs_epi16"=>[["AVX512VL", "AVX512BW"]],
5305
+ "_mm_maskz_subs_epi16"=>[["AVX512VL", "AVX512BW"]],
5306
+ "_mm256_mask_subs_epu8"=>[["AVX512VL", "AVX512BW"]],
5307
+ "_mm256_maskz_subs_epu8"=>[["AVX512VL", "AVX512BW"]],
5308
5308
  "_mm512_mask_subs_epu8"=>["AVX512BW"],
5309
5309
  "_mm512_maskz_subs_epu8"=>["AVX512BW"],
5310
5310
  "_mm512_subs_epu8"=>["AVX512BW"],
5311
- "_mm_mask_subs_epu8"=>["AVX512VL", "AVX512BW"],
5312
- "_mm_maskz_subs_epu8"=>["AVX512VL", "AVX512BW"],
5313
- "_mm256_mask_subs_epu16"=>["AVX512VL", "AVX512BW"],
5314
- "_mm256_maskz_subs_epu16"=>["AVX512VL", "AVX512BW"],
5311
+ "_mm_mask_subs_epu8"=>[["AVX512VL", "AVX512BW"]],
5312
+ "_mm_maskz_subs_epu8"=>[["AVX512VL", "AVX512BW"]],
5313
+ "_mm256_mask_subs_epu16"=>[["AVX512VL", "AVX512BW"]],
5314
+ "_mm256_maskz_subs_epu16"=>[["AVX512VL", "AVX512BW"]],
5315
5315
  "_mm512_mask_subs_epu16"=>["AVX512BW"],
5316
5316
  "_mm512_maskz_subs_epu16"=>["AVX512BW"],
5317
5317
  "_mm512_subs_epu16"=>["AVX512BW"],
5318
- "_mm_mask_subs_epu16"=>["AVX512VL", "AVX512BW"],
5319
- "_mm_maskz_subs_epu16"=>["AVX512VL", "AVX512BW"],
5320
- "_mm256_mask_sub_epi16"=>["AVX512VL", "AVX512BW"],
5321
- "_mm256_maskz_sub_epi16"=>["AVX512VL", "AVX512BW"],
5318
+ "_mm_mask_subs_epu16"=>[["AVX512VL", "AVX512BW"]],
5319
+ "_mm_maskz_subs_epu16"=>[["AVX512VL", "AVX512BW"]],
5320
+ "_mm256_mask_sub_epi16"=>[["AVX512VL", "AVX512BW"]],
5321
+ "_mm256_maskz_sub_epi16"=>[["AVX512VL", "AVX512BW"]],
5322
5322
  "_mm512_mask_sub_epi16"=>["AVX512BW"],
5323
5323
  "_mm512_maskz_sub_epi16"=>["AVX512BW"],
5324
5324
  "_mm512_sub_epi16"=>["AVX512BW"],
5325
- "_mm_mask_sub_epi16"=>["AVX512VL", "AVX512BW"],
5326
- "_mm_maskz_sub_epi16"=>["AVX512VL", "AVX512BW"],
5327
- "_mm256_mask_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5328
- "_mm256_maskz_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5329
- "_mm256_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5330
- "_mm_mask_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5331
- "_mm_maskz_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5332
- "_mm_ternarylogic_epi32"=>["AVX512VL", "AVX512F"],
5333
- "_mm256_mask_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5334
- "_mm256_maskz_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5335
- "_mm256_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5336
- "_mm_mask_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5337
- "_mm_maskz_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5338
- "_mm_ternarylogic_epi64"=>["AVX512VL", "AVX512F"],
5339
- "_mm256_mask_test_epi8_mask"=>["AVX512VL", "AVX512BW"],
5340
- "_mm256_test_epi8_mask"=>["AVX512VL", "AVX512BW"],
5325
+ "_mm_mask_sub_epi16"=>[["AVX512VL", "AVX512BW"]],
5326
+ "_mm_maskz_sub_epi16"=>[["AVX512VL", "AVX512BW"]],
5327
+ "_mm256_mask_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5328
+ "_mm256_maskz_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5329
+ "_mm256_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5330
+ "_mm_mask_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5331
+ "_mm_maskz_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5332
+ "_mm_ternarylogic_epi32"=>[["AVX512VL", "AVX512F"]],
5333
+ "_mm256_mask_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5334
+ "_mm256_maskz_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5335
+ "_mm256_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5336
+ "_mm_mask_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5337
+ "_mm_maskz_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5338
+ "_mm_ternarylogic_epi64"=>[["AVX512VL", "AVX512F"]],
5339
+ "_mm256_mask_test_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5340
+ "_mm256_test_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5341
5341
  "_mm512_mask_test_epi8_mask"=>["AVX512BW"],
5342
5342
  "_mm512_test_epi8_mask"=>["AVX512BW"],
5343
- "_mm_mask_test_epi8_mask"=>["AVX512VL", "AVX512BW"],
5344
- "_mm_test_epi8_mask"=>["AVX512VL", "AVX512BW"],
5345
- "_mm256_mask_test_epi32_mask"=>["AVX512VL", "AVX512F"],
5346
- "_mm256_test_epi32_mask"=>["AVX512VL", "AVX512F"],
5347
- "_mm_mask_test_epi32_mask"=>["AVX512VL", "AVX512F"],
5348
- "_mm_test_epi32_mask"=>["AVX512VL", "AVX512F"],
5349
- "_mm256_mask_test_epi64_mask"=>["AVX512VL", "AVX512F"],
5350
- "_mm256_test_epi64_mask"=>["AVX512VL", "AVX512F"],
5351
- "_mm_mask_test_epi64_mask"=>["AVX512VL", "AVX512F"],
5352
- "_mm_test_epi64_mask"=>["AVX512VL", "AVX512F"],
5353
- "_mm256_mask_test_epi16_mask"=>["AVX512VL", "AVX512BW"],
5354
- "_mm256_test_epi16_mask"=>["AVX512VL", "AVX512BW"],
5343
+ "_mm_mask_test_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5344
+ "_mm_test_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5345
+ "_mm256_mask_test_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5346
+ "_mm256_test_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5347
+ "_mm_mask_test_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5348
+ "_mm_test_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5349
+ "_mm256_mask_test_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5350
+ "_mm256_test_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5351
+ "_mm_mask_test_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5352
+ "_mm_test_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5353
+ "_mm256_mask_test_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5354
+ "_mm256_test_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5355
5355
  "_mm512_mask_test_epi16_mask"=>["AVX512BW"],
5356
5356
  "_mm512_test_epi16_mask"=>["AVX512BW"],
5357
- "_mm_mask_test_epi16_mask"=>["AVX512VL", "AVX512BW"],
5358
- "_mm_test_epi16_mask"=>["AVX512VL", "AVX512BW"],
5359
- "_mm256_mask_testn_epi8_mask"=>["AVX512VL", "AVX512BW"],
5360
- "_mm256_testn_epi8_mask"=>["AVX512VL", "AVX512BW"],
5357
+ "_mm_mask_test_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5358
+ "_mm_test_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5359
+ "_mm256_mask_testn_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5360
+ "_mm256_testn_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5361
5361
  "_mm512_mask_testn_epi8_mask"=>["AVX512BW"],
5362
5362
  "_mm512_testn_epi8_mask"=>["AVX512BW"],
5363
- "_mm_mask_testn_epi8_mask"=>["AVX512VL", "AVX512BW"],
5364
- "_mm_testn_epi8_mask"=>["AVX512VL", "AVX512BW"],
5365
- "_mm256_mask_testn_epi32_mask"=>["AVX512VL", "AVX512F"],
5366
- "_mm256_testn_epi32_mask"=>["AVX512VL", "AVX512F"],
5367
- "_mm_mask_testn_epi32_mask"=>["AVX512VL", "AVX512F"],
5368
- "_mm_testn_epi32_mask"=>["AVX512VL", "AVX512F"],
5369
- "_mm256_mask_testn_epi64_mask"=>["AVX512VL", "AVX512F"],
5370
- "_mm256_testn_epi64_mask"=>["AVX512VL", "AVX512F"],
5371
- "_mm_mask_testn_epi64_mask"=>["AVX512VL", "AVX512F"],
5372
- "_mm_testn_epi64_mask"=>["AVX512VL", "AVX512F"],
5373
- "_mm256_mask_testn_epi16_mask"=>["AVX512VL", "AVX512BW"],
5374
- "_mm256_testn_epi16_mask"=>["AVX512VL", "AVX512BW"],
5363
+ "_mm_mask_testn_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5364
+ "_mm_testn_epi8_mask"=>[["AVX512VL", "AVX512BW"]],
5365
+ "_mm256_mask_testn_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5366
+ "_mm256_testn_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5367
+ "_mm_mask_testn_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5368
+ "_mm_testn_epi32_mask"=>[["AVX512VL", "AVX512F"]],
5369
+ "_mm256_mask_testn_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5370
+ "_mm256_testn_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5371
+ "_mm_mask_testn_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5372
+ "_mm_testn_epi64_mask"=>[["AVX512VL", "AVX512F"]],
5373
+ "_mm256_mask_testn_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5374
+ "_mm256_testn_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5375
5375
  "_mm512_mask_testn_epi16_mask"=>["AVX512BW"],
5376
5376
  "_mm512_testn_epi16_mask"=>["AVX512BW"],
5377
- "_mm_mask_testn_epi16_mask"=>["AVX512VL", "AVX512BW"],
5378
- "_mm_testn_epi16_mask"=>["AVX512VL", "AVX512BW"],
5379
- "_mm256_mask_unpackhi_epi8"=>["AVX512VL", "AVX512BW"],
5380
- "_mm256_maskz_unpackhi_epi8"=>["AVX512VL", "AVX512BW"],
5377
+ "_mm_mask_testn_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5378
+ "_mm_testn_epi16_mask"=>[["AVX512VL", "AVX512BW"]],
5379
+ "_mm256_mask_unpackhi_epi8"=>[["AVX512VL", "AVX512BW"]],
5380
+ "_mm256_maskz_unpackhi_epi8"=>[["AVX512VL", "AVX512BW"]],
5381
5381
  "_mm512_mask_unpackhi_epi8"=>["AVX512BW"],
5382
5382
  "_mm512_maskz_unpackhi_epi8"=>["AVX512BW"],
5383
5383
  "_mm512_unpackhi_epi8"=>["AVX512BW"],
5384
- "_mm_mask_unpackhi_epi8"=>["AVX512VL", "AVX512BW"],
5385
- "_mm_maskz_unpackhi_epi8"=>["AVX512VL", "AVX512BW"],
5386
- "_mm256_mask_unpackhi_epi32"=>["AVX512VL", "AVX512F"],
5387
- "_mm256_maskz_unpackhi_epi32"=>["AVX512VL", "AVX512F"],
5388
- "_mm_mask_unpackhi_epi32"=>["AVX512VL", "AVX512F"],
5389
- "_mm_maskz_unpackhi_epi32"=>["AVX512VL", "AVX512F"],
5390
- "_mm256_mask_unpackhi_epi64"=>["AVX512VL", "AVX512F"],
5391
- "_mm256_maskz_unpackhi_epi64"=>["AVX512VL", "AVX512F"],
5392
- "_mm_mask_unpackhi_epi64"=>["AVX512VL", "AVX512F"],
5393
- "_mm_maskz_unpackhi_epi64"=>["AVX512VL", "AVX512F"],
5394
- "_mm256_mask_unpackhi_epi16"=>["AVX512VL", "AVX512BW"],
5395
- "_mm256_maskz_unpackhi_epi16"=>["AVX512VL", "AVX512BW"],
5384
+ "_mm_mask_unpackhi_epi8"=>[["AVX512VL", "AVX512BW"]],
5385
+ "_mm_maskz_unpackhi_epi8"=>[["AVX512VL", "AVX512BW"]],
5386
+ "_mm256_mask_unpackhi_epi32"=>[["AVX512VL", "AVX512F"]],
5387
+ "_mm256_maskz_unpackhi_epi32"=>[["AVX512VL", "AVX512F"]],
5388
+ "_mm_mask_unpackhi_epi32"=>[["AVX512VL", "AVX512F"]],
5389
+ "_mm_maskz_unpackhi_epi32"=>[["AVX512VL", "AVX512F"]],
5390
+ "_mm256_mask_unpackhi_epi64"=>[["AVX512VL", "AVX512F"]],
5391
+ "_mm256_maskz_unpackhi_epi64"=>[["AVX512VL", "AVX512F"]],
5392
+ "_mm_mask_unpackhi_epi64"=>[["AVX512VL", "AVX512F"]],
5393
+ "_mm_maskz_unpackhi_epi64"=>[["AVX512VL", "AVX512F"]],
5394
+ "_mm256_mask_unpackhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5395
+ "_mm256_maskz_unpackhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5396
5396
  "_mm512_mask_unpackhi_epi16"=>["AVX512BW"],
5397
5397
  "_mm512_maskz_unpackhi_epi16"=>["AVX512BW"],
5398
5398
  "_mm512_unpackhi_epi16"=>["AVX512BW"],
5399
- "_mm_mask_unpackhi_epi16"=>["AVX512VL", "AVX512BW"],
5400
- "_mm_maskz_unpackhi_epi16"=>["AVX512VL", "AVX512BW"],
5401
- "_mm256_mask_unpacklo_epi8"=>["AVX512VL", "AVX512BW"],
5402
- "_mm256_maskz_unpacklo_epi8"=>["AVX512VL", "AVX512BW"],
5399
+ "_mm_mask_unpackhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5400
+ "_mm_maskz_unpackhi_epi16"=>[["AVX512VL", "AVX512BW"]],
5401
+ "_mm256_mask_unpacklo_epi8"=>[["AVX512VL", "AVX512BW"]],
5402
+ "_mm256_maskz_unpacklo_epi8"=>[["AVX512VL", "AVX512BW"]],
5403
5403
  "_mm512_mask_unpacklo_epi8"=>["AVX512BW"],
5404
5404
  "_mm512_maskz_unpacklo_epi8"=>["AVX512BW"],
5405
5405
  "_mm512_unpacklo_epi8"=>["AVX512BW"],
5406
- "_mm_mask_unpacklo_epi8"=>["AVX512VL", "AVX512BW"],
5407
- "_mm_maskz_unpacklo_epi8"=>["AVX512VL", "AVX512BW"],
5408
- "_mm256_mask_unpacklo_epi32"=>["AVX512VL", "AVX512F"],
5409
- "_mm256_maskz_unpacklo_epi32"=>["AVX512VL", "AVX512F"],
5410
- "_mm_mask_unpacklo_epi32"=>["AVX512VL", "AVX512F"],
5411
- "_mm_maskz_unpacklo_epi32"=>["AVX512VL", "AVX512F"],
5412
- "_mm256_mask_unpacklo_epi64"=>["AVX512VL", "AVX512F"],
5413
- "_mm256_maskz_unpacklo_epi64"=>["AVX512VL", "AVX512F"],
5414
- "_mm_mask_unpacklo_epi64"=>["AVX512VL", "AVX512F"],
5415
- "_mm_maskz_unpacklo_epi64"=>["AVX512VL", "AVX512F"],
5416
- "_mm256_mask_unpacklo_epi16"=>["AVX512VL", "AVX512BW"],
5417
- "_mm256_maskz_unpacklo_epi16"=>["AVX512VL", "AVX512BW"],
5406
+ "_mm_mask_unpacklo_epi8"=>[["AVX512VL", "AVX512BW"]],
5407
+ "_mm_maskz_unpacklo_epi8"=>[["AVX512VL", "AVX512BW"]],
5408
+ "_mm256_mask_unpacklo_epi32"=>[["AVX512VL", "AVX512F"]],
5409
+ "_mm256_maskz_unpacklo_epi32"=>[["AVX512VL", "AVX512F"]],
5410
+ "_mm_mask_unpacklo_epi32"=>[["AVX512VL", "AVX512F"]],
5411
+ "_mm_maskz_unpacklo_epi32"=>[["AVX512VL", "AVX512F"]],
5412
+ "_mm256_mask_unpacklo_epi64"=>[["AVX512VL", "AVX512F"]],
5413
+ "_mm256_maskz_unpacklo_epi64"=>[["AVX512VL", "AVX512F"]],
5414
+ "_mm_mask_unpacklo_epi64"=>[["AVX512VL", "AVX512F"]],
5415
+ "_mm_maskz_unpacklo_epi64"=>[["AVX512VL", "AVX512F"]],
5416
+ "_mm256_mask_unpacklo_epi16"=>[["AVX512VL", "AVX512BW"]],
5417
+ "_mm256_maskz_unpacklo_epi16"=>[["AVX512VL", "AVX512BW"]],
5418
5418
  "_mm512_mask_unpacklo_epi16"=>["AVX512BW"],
5419
5419
  "_mm512_maskz_unpacklo_epi16"=>["AVX512BW"],
5420
5420
  "_mm512_unpacklo_epi16"=>["AVX512BW"],
5421
- "_mm_mask_unpacklo_epi16"=>["AVX512VL", "AVX512BW"],
5422
- "_mm_maskz_unpacklo_epi16"=>["AVX512VL", "AVX512BW"],
5423
- "_mm256_mask_xor_epi32"=>["AVX512VL", "AVX512F"],
5424
- "_mm256_maskz_xor_epi32"=>["AVX512VL", "AVX512F"],
5425
- "_mm_mask_xor_epi32"=>["AVX512VL", "AVX512F"],
5426
- "_mm_maskz_xor_epi32"=>["AVX512VL", "AVX512F"],
5427
- "_mm256_mask_xor_epi64"=>["AVX512VL", "AVX512F"],
5428
- "_mm256_maskz_xor_epi64"=>["AVX512VL", "AVX512F"],
5429
- "_mm_mask_xor_epi64"=>["AVX512VL", "AVX512F"],
5430
- "_mm_maskz_xor_epi64"=>["AVX512VL", "AVX512F"],
5431
- "_mm256_mask_range_pd"=>["AVX512VL", "AVX512DQ"],
5432
- "_mm256_maskz_range_pd"=>["AVX512VL", "AVX512DQ"],
5433
- "_mm256_range_pd"=>["AVX512VL", "AVX512DQ"],
5421
+ "_mm_mask_unpacklo_epi16"=>[["AVX512VL", "AVX512BW"]],
5422
+ "_mm_maskz_unpacklo_epi16"=>[["AVX512VL", "AVX512BW"]],
5423
+ "_mm256_mask_xor_epi32"=>[["AVX512VL", "AVX512F"]],
5424
+ "_mm256_maskz_xor_epi32"=>[["AVX512VL", "AVX512F"]],
5425
+ "_mm_mask_xor_epi32"=>[["AVX512VL", "AVX512F"]],
5426
+ "_mm_maskz_xor_epi32"=>[["AVX512VL", "AVX512F"]],
5427
+ "_mm256_mask_xor_epi64"=>[["AVX512VL", "AVX512F"]],
5428
+ "_mm256_maskz_xor_epi64"=>[["AVX512VL", "AVX512F"]],
5429
+ "_mm_mask_xor_epi64"=>[["AVX512VL", "AVX512F"]],
5430
+ "_mm_maskz_xor_epi64"=>[["AVX512VL", "AVX512F"]],
5431
+ "_mm256_mask_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5432
+ "_mm256_maskz_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5433
+ "_mm256_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5434
5434
  "_mm512_mask_range_pd"=>["AVX512DQ"],
5435
5435
  "_mm512_mask_range_round_pd"=>["AVX512DQ"],
5436
5436
  "_mm512_maskz_range_pd"=>["AVX512DQ"],
5437
5437
  "_mm512_maskz_range_round_pd"=>["AVX512DQ"],
5438
5438
  "_mm512_range_pd"=>["AVX512DQ"],
5439
5439
  "_mm512_range_round_pd"=>["AVX512DQ"],
5440
- "_mm_mask_range_pd"=>["AVX512VL", "AVX512DQ"],
5441
- "_mm_maskz_range_pd"=>["AVX512VL", "AVX512DQ"],
5442
- "_mm_range_pd"=>["AVX512VL", "AVX512DQ"],
5443
- "_mm256_mask_range_ps"=>["AVX512VL", "AVX512DQ"],
5444
- "_mm256_maskz_range_ps"=>["AVX512VL", "AVX512DQ"],
5445
- "_mm256_range_ps"=>["AVX512VL", "AVX512DQ"],
5440
+ "_mm_mask_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5441
+ "_mm_maskz_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5442
+ "_mm_range_pd"=>[["AVX512VL", "AVX512DQ"]],
5443
+ "_mm256_mask_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5444
+ "_mm256_maskz_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5445
+ "_mm256_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5446
5446
  "_mm512_mask_range_ps"=>["AVX512DQ"],
5447
5447
  "_mm512_mask_range_round_ps"=>["AVX512DQ"],
5448
5448
  "_mm512_maskz_range_ps"=>["AVX512DQ"],
5449
5449
  "_mm512_maskz_range_round_ps"=>["AVX512DQ"],
5450
5450
  "_mm512_range_ps"=>["AVX512DQ"],
5451
5451
  "_mm512_range_round_ps"=>["AVX512DQ"],
5452
- "_mm_mask_range_ps"=>["AVX512VL", "AVX512DQ"],
5453
- "_mm_maskz_range_ps"=>["AVX512VL", "AVX512DQ"],
5454
- "_mm_range_ps"=>["AVX512VL", "AVX512DQ"],
5452
+ "_mm_mask_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5453
+ "_mm_maskz_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5454
+ "_mm_range_ps"=>[["AVX512VL", "AVX512DQ"]],
5455
5455
  "_mm_mask_range_round_sd"=>["AVX512DQ"],
5456
5456
  "_mm_mask_range_sd"=>["AVX512DQ"],
5457
5457
  "_mm_maskz_range_round_sd"=>["AVX512DQ"],
@@ -5462,42 +5462,42 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
5462
5462
  "_mm_maskz_range_round_ss"=>["AVX512DQ"],
5463
5463
  "_mm_maskz_range_ss"=>["AVX512DQ"],
5464
5464
  "_mm_range_round_ss"=>["AVX512DQ"],
5465
- "_mm256_mask_rcp14_pd"=>["AVX512VL", "AVX512F"],
5466
- "_mm256_maskz_rcp14_pd"=>["AVX512VL", "AVX512F"],
5467
- "_mm256_rcp14_pd"=>["AVX512VL", "AVX512F"],
5468
- "_mm_mask_rcp14_pd"=>["AVX512VL", "AVX512F"],
5469
- "_mm_maskz_rcp14_pd"=>["AVX512VL", "AVX512F"],
5470
- "_mm_rcp14_pd"=>["AVX512VL", "AVX512F"],
5471
- "_mm256_mask_rcp14_ps"=>["AVX512VL", "AVX512F"],
5472
- "_mm256_maskz_rcp14_ps"=>["AVX512VL", "AVX512F"],
5473
- "_mm256_rcp14_ps"=>["AVX512VL", "AVX512F"],
5474
- "_mm_mask_rcp14_ps"=>["AVX512VL", "AVX512F"],
5475
- "_mm_maskz_rcp14_ps"=>["AVX512VL", "AVX512F"],
5476
- "_mm_rcp14_ps"=>["AVX512VL", "AVX512F"],
5477
- "_mm256_mask_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5478
- "_mm256_maskz_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5479
- "_mm256_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5465
+ "_mm256_mask_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5466
+ "_mm256_maskz_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5467
+ "_mm256_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5468
+ "_mm_mask_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5469
+ "_mm_maskz_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5470
+ "_mm_rcp14_pd"=>[["AVX512VL", "AVX512F"]],
5471
+ "_mm256_mask_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5472
+ "_mm256_maskz_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5473
+ "_mm256_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5474
+ "_mm_mask_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5475
+ "_mm_maskz_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5476
+ "_mm_rcp14_ps"=>[["AVX512VL", "AVX512F"]],
5477
+ "_mm256_mask_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5478
+ "_mm256_maskz_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5479
+ "_mm256_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5480
5480
  "_mm512_mask_reduce_pd"=>["AVX512DQ"],
5481
5481
  "_mm512_mask_reduce_round_pd"=>["AVX512DQ"],
5482
5482
  "_mm512_maskz_reduce_pd"=>["AVX512DQ"],
5483
5483
  "_mm512_maskz_reduce_round_pd"=>["AVX512DQ"],
5484
5484
  "_mm512_reduce_pd"=>["AVX512DQ"],
5485
5485
  "_mm512_reduce_round_pd"=>["AVX512DQ"],
5486
- "_mm_mask_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5487
- "_mm_maskz_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5488
- "_mm_reduce_pd"=>["AVX512VL", "AVX512DQ"],
5489
- "_mm256_mask_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5490
- "_mm256_maskz_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5491
- "_mm256_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5486
+ "_mm_mask_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5487
+ "_mm_maskz_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5488
+ "_mm_reduce_pd"=>[["AVX512VL", "AVX512DQ"]],
5489
+ "_mm256_mask_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5490
+ "_mm256_maskz_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5491
+ "_mm256_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5492
5492
  "_mm512_mask_reduce_ps"=>["AVX512DQ"],
5493
5493
  "_mm512_mask_reduce_round_ps"=>["AVX512DQ"],
5494
5494
  "_mm512_maskz_reduce_ps"=>["AVX512DQ"],
5495
5495
  "_mm512_maskz_reduce_round_ps"=>["AVX512DQ"],
5496
5496
  "_mm512_reduce_ps"=>["AVX512DQ"],
5497
5497
  "_mm512_reduce_round_ps"=>["AVX512DQ"],
5498
- "_mm_mask_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5499
- "_mm_maskz_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5500
- "_mm_reduce_ps"=>["AVX512VL", "AVX512DQ"],
5498
+ "_mm_mask_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5499
+ "_mm_maskz_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5500
+ "_mm_reduce_ps"=>[["AVX512VL", "AVX512DQ"]],
5501
5501
  "_mm_mask_reduce_sd"=>["AVX512DQ"],
5502
5502
  "_mm_mask_reduce_round_sd"=>["AVX512DQ"],
5503
5503
  "_mm_maskz_reduce_sd"=>["AVX512DQ"],
@@ -5510,167 +5510,167 @@ X86CPUID_by_name ={"_m_from_int64"=>["MMX"],
5510
5510
  "_mm_maskz_reduce_round_ss"=>["AVX512DQ"],
5511
5511
  "_mm_reduce_ss"=>["AVX512DQ"],
5512
5512
  "_mm_reduce_round_ss"=>["AVX512DQ"],
5513
- "_mm256_mask_roundscale_pd"=>["AVX512VL", "AVX512F"],
5514
- "_mm256_maskz_roundscale_pd"=>["AVX512VL", "AVX512F"],
5515
- "_mm256_roundscale_pd"=>["AVX512VL", "AVX512F"],
5516
- "_mm_mask_roundscale_pd"=>["AVX512VL", "AVX512F"],
5517
- "_mm_maskz_roundscale_pd"=>["AVX512VL", "AVX512F"],
5518
- "_mm_roundscale_pd"=>["AVX512VL", "AVX512F"],
5519
- "_mm256_mask_roundscale_ps"=>["AVX512VL", "AVX512F"],
5520
- "_mm256_maskz_roundscale_ps"=>["AVX512VL", "AVX512F"],
5521
- "_mm256_roundscale_ps"=>["AVX512VL", "AVX512F"],
5522
- "_mm_mask_roundscale_ps"=>["AVX512VL", "AVX512F"],
5523
- "_mm_maskz_roundscale_ps"=>["AVX512VL", "AVX512F"],
5524
- "_mm_roundscale_ps"=>["AVX512VL", "AVX512F"],
5525
- "_mm256_mask_rsqrt14_pd"=>["AVX512VL", "AVX512F"],
5526
- "_mm256_maskz_rsqrt14_pd"=>["AVX512VL", "AVX512F"],
5527
- "_mm_mask_rsqrt14_pd"=>["AVX512VL", "AVX512F"],
5528
- "_mm_maskz_rsqrt14_pd"=>["AVX512VL", "AVX512F"],
5529
- "_mm256_mask_rsqrt14_ps"=>["AVX512VL", "AVX512F"],
5530
- "_mm256_maskz_rsqrt14_ps"=>["AVX512VL", "AVX512F"],
5531
- "_mm_mask_rsqrt14_ps"=>["AVX512VL", "AVX512F"],
5532
- "_mm_maskz_rsqrt14_ps"=>["AVX512VL", "AVX512F"],
5533
- "_mm256_mask_scalef_pd"=>["AVX512VL", "AVX512F"],
5534
- "_mm256_maskz_scalef_pd"=>["AVX512VL", "AVX512F"],
5535
- "_mm256_scalef_pd"=>["AVX512VL", "AVX512F"],
5536
- "_mm_mask_scalef_pd"=>["AVX512VL", "AVX512F"],
5537
- "_mm_maskz_scalef_pd"=>["AVX512VL", "AVX512F"],
5538
- "_mm_scalef_pd"=>["AVX512VL", "AVX512F"],
5539
- "_mm256_mask_scalef_ps"=>["AVX512VL", "AVX512F"],
5540
- "_mm256_maskz_scalef_ps"=>["AVX512VL", "AVX512F"],
5541
- "_mm256_scalef_ps"=>["AVX512VL", "AVX512F"],
5542
- "_mm_mask_scalef_ps"=>["AVX512VL", "AVX512F"],
5543
- "_mm_maskz_scalef_ps"=>["AVX512VL", "AVX512F"],
5544
- "_mm_scalef_ps"=>["AVX512VL", "AVX512F"],
5545
- "_mm256_i32scatter_pd"=>["AVX512VL", "AVX512F"],
5546
- "_mm256_mask_i32scatter_pd"=>["AVX512VL", "AVX512F"],
5547
- "_mm_i32scatter_pd"=>["AVX512VL", "AVX512F"],
5548
- "_mm_mask_i32scatter_pd"=>["AVX512VL", "AVX512F"],
5549
- "_mm256_i32scatter_ps"=>["AVX512VL", "AVX512F"],
5550
- "_mm256_mask_i32scatter_ps"=>["AVX512VL", "AVX512F"],
5551
- "_mm_i32scatter_ps"=>["AVX512VL", "AVX512F"],
5552
- "_mm_mask_i32scatter_ps"=>["AVX512VL", "AVX512F"],
5553
- "_mm256_i64scatter_pd"=>["AVX512VL", "AVX512F"],
5554
- "_mm256_mask_i64scatter_pd"=>["AVX512VL", "AVX512F"],
5555
- "_mm_i64scatter_pd"=>["AVX512VL", "AVX512F"],
5556
- "_mm_mask_i64scatter_pd"=>["AVX512VL", "AVX512F"],
5557
- "_mm256_i64scatter_ps"=>["AVX512VL", "AVX512F"],
5558
- "_mm256_mask_i64scatter_ps"=>["AVX512VL", "AVX512F"],
5559
- "_mm_i64scatter_ps"=>["AVX512VL", "AVX512F"],
5560
- "_mm_mask_i64scatter_ps"=>["AVX512VL", "AVX512F"],
5561
- "_mm256_mask_shuffle_f32x4"=>["AVX512VL", "AVX512F"],
5562
- "_mm256_maskz_shuffle_f32x4"=>["AVX512VL", "AVX512F"],
5563
- "_mm256_shuffle_f32x4"=>["AVX512VL", "AVX512F"],
5564
- "_mm256_mask_shuffle_f64x2"=>["AVX512VL", "AVX512F"],
5565
- "_mm256_maskz_shuffle_f64x2"=>["AVX512VL", "AVX512F"],
5566
- "_mm256_shuffle_f64x2"=>["AVX512VL", "AVX512F"],
5567
- "_mm256_mask_shuffle_i32x4"=>["AVX512VL", "AVX512F"],
5568
- "_mm256_maskz_shuffle_i32x4"=>["AVX512VL", "AVX512F"],
5569
- "_mm256_shuffle_i32x4"=>["AVX512VL", "AVX512F"],
5570
- "_mm256_mask_shuffle_i64x2"=>["AVX512VL", "AVX512F"],
5571
- "_mm256_maskz_shuffle_i64x2"=>["AVX512VL", "AVX512F"],
5572
- "_mm256_shuffle_i64x2"=>["AVX512VL", "AVX512F"],
5573
- "_mm256_mask_shuffle_pd"=>["AVX512VL", "AVX512F"],
5574
- "_mm256_maskz_shuffle_pd"=>["AVX512VL", "AVX512F"],
5575
- "_mm_mask_shuffle_pd"=>["AVX512VL", "AVX512F"],
5576
- "_mm_maskz_shuffle_pd"=>["AVX512VL", "AVX512F"],
5577
- "_mm256_mask_shuffle_ps"=>["AVX512VL", "AVX512F"],
5578
- "_mm256_maskz_shuffle_ps"=>["AVX512VL", "AVX512F"],
5579
- "_mm_mask_shuffle_ps"=>["AVX512VL", "AVX512F"],
5580
- "_mm_maskz_shuffle_ps"=>["AVX512VL", "AVX512F"],
5581
- "_mm256_mask_sqrt_pd"=>["AVX512VL", "AVX512F"],
5582
- "_mm256_maskz_sqrt_pd"=>["AVX512VL", "AVX512F"],
5583
- "_mm_mask_sqrt_pd"=>["AVX512VL", "AVX512F"],
5584
- "_mm_maskz_sqrt_pd"=>["AVX512VL", "AVX512F"],
5585
- "_mm256_mask_sqrt_ps"=>["AVX512VL", "AVX512F"],
5586
- "_mm256_maskz_sqrt_ps"=>["AVX512VL", "AVX512F"],
5587
- "_mm_mask_sqrt_ps"=>["AVX512VL", "AVX512F"],
5588
- "_mm_maskz_sqrt_ps"=>["AVX512VL", "AVX512F"],
5589
- "_mm256_mask_sub_pd"=>["AVX512VL", "AVX512F"],
5590
- "_mm256_maskz_sub_pd"=>["AVX512VL", "AVX512F"],
5591
- "_mm_mask_sub_pd"=>["AVX512VL", "AVX512F"],
5592
- "_mm_maskz_sub_pd"=>["AVX512VL", "AVX512F"],
5593
- "_mm256_mask_sub_ps"=>["AVX512VL", "AVX512F"],
5594
- "_mm256_maskz_sub_ps"=>["AVX512VL", "AVX512F"],
5595
- "_mm_mask_sub_ps"=>["AVX512VL", "AVX512F"],
5596
- "_mm_maskz_sub_ps"=>["AVX512VL", "AVX512F"],
5597
- "_mm256_mask_unpackhi_pd"=>["AVX512VL", "AVX512F"],
5598
- "_mm256_maskz_unpackhi_pd"=>["AVX512VL", "AVX512F"],
5599
- "_mm_mask_unpackhi_pd"=>["AVX512VL", "AVX512F"],
5600
- "_mm_maskz_unpackhi_pd"=>["AVX512VL", "AVX512F"],
5601
- "_mm256_mask_unpackhi_ps"=>["AVX512VL", "AVX512F"],
5602
- "_mm256_maskz_unpackhi_ps"=>["AVX512VL", "AVX512F"],
5603
- "_mm_mask_unpackhi_ps"=>["AVX512VL", "AVX512F"],
5604
- "_mm_maskz_unpackhi_ps"=>["AVX512VL", "AVX512F"],
5605
- "_mm256_mask_unpacklo_pd"=>["AVX512VL", "AVX512F"],
5606
- "_mm256_maskz_unpacklo_pd"=>["AVX512VL", "AVX512F"],
5607
- "_mm_mask_unpacklo_pd"=>["AVX512VL", "AVX512F"],
5608
- "_mm_maskz_unpacklo_pd"=>["AVX512VL", "AVX512F"],
5609
- "_mm256_mask_unpacklo_ps"=>["AVX512VL", "AVX512F"],
5610
- "_mm256_maskz_unpacklo_ps"=>["AVX512VL", "AVX512F"],
5611
- "_mm_mask_unpacklo_ps"=>["AVX512VL", "AVX512F"],
5612
- "_mm_maskz_unpacklo_ps"=>["AVX512VL", "AVX512F"],
5613
- "_mm256_mask_xor_pd"=>["AVX512VL", "AVX512DQ"],
5614
- "_mm256_maskz_xor_pd"=>["AVX512VL", "AVX512DQ"],
5513
+ "_mm256_mask_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5514
+ "_mm256_maskz_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5515
+ "_mm256_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5516
+ "_mm_mask_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5517
+ "_mm_maskz_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5518
+ "_mm_roundscale_pd"=>[["AVX512VL", "AVX512F"]],
5519
+ "_mm256_mask_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5520
+ "_mm256_maskz_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5521
+ "_mm256_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5522
+ "_mm_mask_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5523
+ "_mm_maskz_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5524
+ "_mm_roundscale_ps"=>[["AVX512VL", "AVX512F"]],
5525
+ "_mm256_mask_rsqrt14_pd"=>[["AVX512VL", "AVX512F"]],
5526
+ "_mm256_maskz_rsqrt14_pd"=>[["AVX512VL", "AVX512F"]],
5527
+ "_mm_mask_rsqrt14_pd"=>[["AVX512VL", "AVX512F"]],
5528
+ "_mm_maskz_rsqrt14_pd"=>[["AVX512VL", "AVX512F"]],
5529
+ "_mm256_mask_rsqrt14_ps"=>[["AVX512VL", "AVX512F"]],
5530
+ "_mm256_maskz_rsqrt14_ps"=>[["AVX512VL", "AVX512F"]],
5531
+ "_mm_mask_rsqrt14_ps"=>[["AVX512VL", "AVX512F"]],
5532
+ "_mm_maskz_rsqrt14_ps"=>[["AVX512VL", "AVX512F"]],
5533
+ "_mm256_mask_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5534
+ "_mm256_maskz_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5535
+ "_mm256_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5536
+ "_mm_mask_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5537
+ "_mm_maskz_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5538
+ "_mm_scalef_pd"=>[["AVX512VL", "AVX512F"]],
5539
+ "_mm256_mask_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5540
+ "_mm256_maskz_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5541
+ "_mm256_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5542
+ "_mm_mask_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5543
+ "_mm_maskz_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5544
+ "_mm_scalef_ps"=>[["AVX512VL", "AVX512F"]],
5545
+ "_mm256_i32scatter_pd"=>[["AVX512VL", "AVX512F"]],
5546
+ "_mm256_mask_i32scatter_pd"=>[["AVX512VL", "AVX512F"]],
5547
+ "_mm_i32scatter_pd"=>[["AVX512VL", "AVX512F"]],
5548
+ "_mm_mask_i32scatter_pd"=>[["AVX512VL", "AVX512F"]],
5549
+ "_mm256_i32scatter_ps"=>[["AVX512VL", "AVX512F"]],
5550
+ "_mm256_mask_i32scatter_ps"=>[["AVX512VL", "AVX512F"]],
5551
+ "_mm_i32scatter_ps"=>[["AVX512VL", "AVX512F"]],
5552
+ "_mm_mask_i32scatter_ps"=>[["AVX512VL", "AVX512F"]],
5553
+ "_mm256_i64scatter_pd"=>[["AVX512VL", "AVX512F"]],
5554
+ "_mm256_mask_i64scatter_pd"=>[["AVX512VL", "AVX512F"]],
5555
+ "_mm_i64scatter_pd"=>[["AVX512VL", "AVX512F"]],
5556
+ "_mm_mask_i64scatter_pd"=>[["AVX512VL", "AVX512F"]],
5557
+ "_mm256_i64scatter_ps"=>[["AVX512VL", "AVX512F"]],
5558
+ "_mm256_mask_i64scatter_ps"=>[["AVX512VL", "AVX512F"]],
5559
+ "_mm_i64scatter_ps"=>[["AVX512VL", "AVX512F"]],
5560
+ "_mm_mask_i64scatter_ps"=>[["AVX512VL", "AVX512F"]],
5561
+ "_mm256_mask_shuffle_f32x4"=>[["AVX512VL", "AVX512F"]],
5562
+ "_mm256_maskz_shuffle_f32x4"=>[["AVX512VL", "AVX512F"]],
5563
+ "_mm256_shuffle_f32x4"=>[["AVX512VL", "AVX512F"]],
5564
+ "_mm256_mask_shuffle_f64x2"=>[["AVX512VL", "AVX512F"]],
5565
+ "_mm256_maskz_shuffle_f64x2"=>[["AVX512VL", "AVX512F"]],
5566
+ "_mm256_shuffle_f64x2"=>[["AVX512VL", "AVX512F"]],
5567
+ "_mm256_mask_shuffle_i32x4"=>[["AVX512VL", "AVX512F"]],
5568
+ "_mm256_maskz_shuffle_i32x4"=>[["AVX512VL", "AVX512F"]],
5569
+ "_mm256_shuffle_i32x4"=>[["AVX512VL", "AVX512F"]],
5570
+ "_mm256_mask_shuffle_i64x2"=>[["AVX512VL", "AVX512F"]],
5571
+ "_mm256_maskz_shuffle_i64x2"=>[["AVX512VL", "AVX512F"]],
5572
+ "_mm256_shuffle_i64x2"=>[["AVX512VL", "AVX512F"]],
5573
+ "_mm256_mask_shuffle_pd"=>[["AVX512VL", "AVX512F"]],
5574
+ "_mm256_maskz_shuffle_pd"=>[["AVX512VL", "AVX512F"]],
5575
+ "_mm_mask_shuffle_pd"=>[["AVX512VL", "AVX512F"]],
5576
+ "_mm_maskz_shuffle_pd"=>[["AVX512VL", "AVX512F"]],
5577
+ "_mm256_mask_shuffle_ps"=>[["AVX512VL", "AVX512F"]],
5578
+ "_mm256_maskz_shuffle_ps"=>[["AVX512VL", "AVX512F"]],
5579
+ "_mm_mask_shuffle_ps"=>[["AVX512VL", "AVX512F"]],
5580
+ "_mm_maskz_shuffle_ps"=>[["AVX512VL", "AVX512F"]],
5581
+ "_mm256_mask_sqrt_pd"=>[["AVX512VL", "AVX512F"]],
5582
+ "_mm256_maskz_sqrt_pd"=>[["AVX512VL", "AVX512F"]],
5583
+ "_mm_mask_sqrt_pd"=>[["AVX512VL", "AVX512F"]],
5584
+ "_mm_maskz_sqrt_pd"=>[["AVX512VL", "AVX512F"]],
5585
+ "_mm256_mask_sqrt_ps"=>[["AVX512VL", "AVX512F"]],
5586
+ "_mm256_maskz_sqrt_ps"=>[["AVX512VL", "AVX512F"]],
5587
+ "_mm_mask_sqrt_ps"=>[["AVX512VL", "AVX512F"]],
5588
+ "_mm_maskz_sqrt_ps"=>[["AVX512VL", "AVX512F"]],
5589
+ "_mm256_mask_sub_pd"=>[["AVX512VL", "AVX512F"]],
5590
+ "_mm256_maskz_sub_pd"=>[["AVX512VL", "AVX512F"]],
5591
+ "_mm_mask_sub_pd"=>[["AVX512VL", "AVX512F"]],
5592
+ "_mm_maskz_sub_pd"=>[["AVX512VL", "AVX512F"]],
5593
+ "_mm256_mask_sub_ps"=>[["AVX512VL", "AVX512F"]],
5594
+ "_mm256_maskz_sub_ps"=>[["AVX512VL", "AVX512F"]],
5595
+ "_mm_mask_sub_ps"=>[["AVX512VL", "AVX512F"]],
5596
+ "_mm_maskz_sub_ps"=>[["AVX512VL", "AVX512F"]],
5597
+ "_mm256_mask_unpackhi_pd"=>[["AVX512VL", "AVX512F"]],
5598
+ "_mm256_maskz_unpackhi_pd"=>[["AVX512VL", "AVX512F"]],
5599
+ "_mm_mask_unpackhi_pd"=>[["AVX512VL", "AVX512F"]],
5600
+ "_mm_maskz_unpackhi_pd"=>[["AVX512VL", "AVX512F"]],
5601
+ "_mm256_mask_unpackhi_ps"=>[["AVX512VL", "AVX512F"]],
5602
+ "_mm256_maskz_unpackhi_ps"=>[["AVX512VL", "AVX512F"]],
5603
+ "_mm_mask_unpackhi_ps"=>[["AVX512VL", "AVX512F"]],
5604
+ "_mm_maskz_unpackhi_ps"=>[["AVX512VL", "AVX512F"]],
5605
+ "_mm256_mask_unpacklo_pd"=>[["AVX512VL", "AVX512F"]],
5606
+ "_mm256_maskz_unpacklo_pd"=>[["AVX512VL", "AVX512F"]],
5607
+ "_mm_mask_unpacklo_pd"=>[["AVX512VL", "AVX512F"]],
5608
+ "_mm_maskz_unpacklo_pd"=>[["AVX512VL", "AVX512F"]],
5609
+ "_mm256_mask_unpacklo_ps"=>[["AVX512VL", "AVX512F"]],
5610
+ "_mm256_maskz_unpacklo_ps"=>[["AVX512VL", "AVX512F"]],
5611
+ "_mm_mask_unpacklo_ps"=>[["AVX512VL", "AVX512F"]],
5612
+ "_mm_maskz_unpacklo_ps"=>[["AVX512VL", "AVX512F"]],
5613
+ "_mm256_mask_xor_pd"=>[["AVX512VL", "AVX512DQ"]],
5614
+ "_mm256_maskz_xor_pd"=>[["AVX512VL", "AVX512DQ"]],
5615
5615
  "_mm512_mask_xor_pd"=>["AVX512DQ"],
5616
5616
  "_mm512_maskz_xor_pd"=>["AVX512DQ"],
5617
5617
  "_mm512_xor_pd"=>["AVX512DQ"],
5618
- "_mm_mask_xor_pd"=>["AVX512VL", "AVX512DQ"],
5619
- "_mm_maskz_xor_pd"=>["AVX512VL", "AVX512DQ"],
5620
- "_mm256_mask_xor_ps"=>["AVX512VL", "AVX512DQ"],
5621
- "_mm256_maskz_xor_ps"=>["AVX512VL", "AVX512DQ"],
5618
+ "_mm_mask_xor_pd"=>[["AVX512VL", "AVX512DQ"]],
5619
+ "_mm_maskz_xor_pd"=>[["AVX512VL", "AVX512DQ"]],
5620
+ "_mm256_mask_xor_ps"=>[["AVX512VL", "AVX512DQ"]],
5621
+ "_mm256_maskz_xor_ps"=>[["AVX512VL", "AVX512DQ"]],
5622
5622
  "_mm512_mask_xor_ps"=>["AVX512DQ"],
5623
5623
  "_mm512_maskz_xor_ps"=>["AVX512DQ"],
5624
5624
  "_mm512_xor_ps"=>["AVX512DQ"],
5625
- "_mm_mask_xor_ps"=>["AVX512VL", "AVX512DQ"],
5626
- "_mm_maskz_xor_ps"=>["AVX512VL", "AVX512DQ"],
5625
+ "_mm_mask_xor_ps"=>[["AVX512VL", "AVX512DQ"]],
5626
+ "_mm_maskz_xor_ps"=>[["AVX512VL", "AVX512DQ"]],
5627
5627
  "_mm512_madd52lo_epu64"=>["AVX512IFMA52"],
5628
5628
  "_mm512_mask_madd52lo_epu64"=>["AVX512IFMA52"],
5629
5629
  "_mm512_maskz_madd52lo_epu64"=>["AVX512IFMA52"],
5630
- "_mm256_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5631
- "_mm256_mask_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5632
- "_mm256_maskz_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5633
- "_mm_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5634
- "_mm_mask_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5635
- "_mm_maskz_madd52lo_epu64"=>["AVX512IFMA52", "AVX512VL"],
5630
+ "_mm256_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5631
+ "_mm256_mask_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5632
+ "_mm256_maskz_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5633
+ "_mm_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5634
+ "_mm_mask_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5635
+ "_mm_maskz_madd52lo_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5636
5636
  "_mm512_madd52hi_epu64"=>["AVX512IFMA52"],
5637
5637
  "_mm512_mask_madd52hi_epu64"=>["AVX512IFMA52"],
5638
5638
  "_mm512_maskz_madd52hi_epu64"=>["AVX512IFMA52"],
5639
- "_mm256_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5640
- "_mm256_mask_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5641
- "_mm256_maskz_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5642
- "_mm_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5643
- "_mm_mask_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5644
- "_mm_maskz_madd52hi_epu64"=>["AVX512IFMA52", "AVX512VL"],
5639
+ "_mm256_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5640
+ "_mm256_mask_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5641
+ "_mm256_maskz_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5642
+ "_mm_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5643
+ "_mm_mask_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5644
+ "_mm_maskz_madd52hi_epu64"=>[["AVX512IFMA52", "AVX512VL"]],
5645
5645
  "_mm512_multishift_epi64_epi8"=>["AVX512VBMI"],
5646
5646
  "_mm512_mask_multishift_epi64_epi8"=>["AVX512VBMI"],
5647
5647
  "_mm512_maskz_multishift_epi64_epi8"=>["AVX512VBMI"],
5648
- "_mm256_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5649
- "_mm256_mask_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5650
- "_mm256_maskz_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5651
- "_mm_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5652
- "_mm_mask_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5653
- "_mm_maskz_multishift_epi64_epi8"=>["AVX512VBMI", "AVX512VL"],
5648
+ "_mm256_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5649
+ "_mm256_mask_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5650
+ "_mm256_maskz_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5651
+ "_mm_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5652
+ "_mm_mask_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5653
+ "_mm_maskz_multishift_epi64_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5654
5654
  "_mm512_permutexvar_epi8"=>["AVX512VBMI"],
5655
5655
  "_mm512_mask_permutexvar_epi8"=>["AVX512VBMI"],
5656
5656
  "_mm512_maskz_permutexvar_epi8"=>["AVX512VBMI"],
5657
- "_mm256_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5658
- "_mm256_mask_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5659
- "_mm256_maskz_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5660
- "_mm_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5661
- "_mm_mask_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5662
- "_mm_maskz_permutexvar_epi8"=>["AVX512VBMI", "AVX512VL"],
5657
+ "_mm256_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5658
+ "_mm256_mask_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5659
+ "_mm256_maskz_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5660
+ "_mm_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5661
+ "_mm_mask_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5662
+ "_mm_maskz_permutexvar_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5663
5663
  "_mm512_permutex2var_epi8"=>["AVX512VBMI"],
5664
5664
  "_mm512_mask_permutex2var_epi8"=>["AVX512VBMI"],
5665
5665
  "_mm512_mask2_permutex2var_epi8"=>["AVX512VBMI"],
5666
5666
  "_mm512_maskz_permutex2var_epi8"=>["AVX512VBMI"],
5667
- "_mm256_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5668
- "_mm256_mask_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5669
- "_mm256_mask2_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5670
- "_mm256_maskz_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5671
- "_mm_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5672
- "_mm_mask_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5673
- "_mm_mask2_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"],
5674
- "_mm_maskz_permutex2var_epi8"=>["AVX512VBMI", "AVX512VL"]}
5667
+ "_mm256_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5668
+ "_mm256_mask_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5669
+ "_mm256_mask2_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5670
+ "_mm256_maskz_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5671
+ "_mm_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5672
+ "_mm_mask_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5673
+ "_mm_mask2_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]],
5674
+ "_mm_maskz_permutex2var_epi8"=>[["AVX512VBMI", "AVX512VL"]]}
5675
5675
  private_constant :X86CPUID_by_name
5676
5676
  end