cann: support q4_0 model (#8822)

This commit is contained in:
wangshuai09
2024-08-05 12:22:30 +08:00
committed by GitHub
parent 0d6fb52be0
commit c02b0a8a4d
7 changed files with 357 additions and 45 deletions

View File

@@ -8,6 +8,8 @@
#include "aclrtlaunch_ascendc_quantize_f32_q8_0.h"
#include "aclrtlaunch_ascendc_quantize_f16_q8_0.h"
#include "aclrtlaunch_ascendc_quantize_f16_to_q4_0.h"
#include "aclrtlaunch_ascendc_quantize_f32_to_q4_0.h"
#include "aclrtlaunch_ascendc_dup_by_rows_fp16.h"
#include "aclrtlaunch_ascendc_dup_by_rows_fp32.h"