# Quantization settings collected in a single dict.
# NOTE(review): the consumer of this dict is not visible here; the key names
# suggest a 4-bit, group-wise weight quantization setup -- confirm against
# the library that reads it before changing any value.
quant_config = {
    "zero_point": True,
    "q_group_size": 128,
    "w_bit": 4,
    "version": "GEMM",
}