; ModuleID = '/home/hakta/Documents/matrix_mult/solution3/.autopilot/db/a.o.2.bc' target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128" target triple = "x86_64-unknown-linux-gnu" @mode5 = internal constant [10 x i8] c"s_axilite\00" @mode3 = internal constant [10 x i8] c"s_axilite\00" @mode = internal constant [10 x i8] c"s_axilite\00" @memcpy_OC_tempB_OC_B = internal unnamed_addr constant [15 x i8] c"memcpy.tempB.B\00" @memcpy_OC_tempA_OC_A = internal unnamed_addr constant [15 x i8] c"memcpy.tempA.A\00" @memcpy_OC_result_OC_s = internal unnamed_addr constant [29 x i8] c"memcpy.result.tempResult.gep\00" @matrix_mult_str = internal unnamed_addr constant [12 x i8] c"matrix_mult\00" @burstwrite_OC_region = internal unnamed_addr constant [18 x i8] c"burstwrite.region\00" @burstread_OC_region_s = internal unnamed_addr constant [17 x i8] c"burstread.region\00" @bundle6 = internal constant [1 x i8] zeroinitializer @bundle4 = internal constant [1 x i8] zeroinitializer @bundle = internal constant [1 x i8] zeroinitializer @p_str9 = internal unnamed_addr constant [1 x i8] zeroinitializer @p_str8 = internal unnamed_addr constant [1 x i8] zeroinitializer @p_str5 = private unnamed_addr constant [24 x i8] c"matrix_mult__outer_loop\00", align 1 @p_str3 = private unnamed_addr constant [10 x i8] c"s_axilite\00", align 1 @p_str2 = private unnamed_addr constant [6 x i8] c"slave\00", align 1 @p_str10 = internal unnamed_addr constant [1 x i8] zeroinitializer @p_str1 = private unnamed_addr constant [1 x i8] zeroinitializer, align 1 @p_str = private unnamed_addr constant [6 x i8] c"m_axi\00", align 1 define void @matrix_mult(i32* %gmem, i32 %A, i32 %B, i32 %result) { %result_read = call i32 @_ssdm_op_Read.s_axilite.i32(i32 %result) %B_read = call i32 @_ssdm_op_Read.s_axilite.i32(i32 %B) %A_read = call i32 @_ssdm_op_Read.s_axilite.i32(i32 %A) %result5 = call i30 
@_ssdm_op_PartSelect.i30.i32.i32.i32(i32 %result_read, i32 2, i32 31) %tmp_5 = zext i30 %result5 to i64 %gmem_addr = getelementptr i32* %gmem, i64 %tmp_5 %B3 = call i30 @_ssdm_op_PartSelect.i30.i32.i32.i32(i32 %B_read, i32 2, i32 31) %tmp_6 = zext i30 %B3 to i64 %gmem_addr_1 = getelementptr i32* %gmem, i64 %tmp_6 %A1 = call i30 @_ssdm_op_PartSelect.i30.i32.i32.i32(i32 %A_read, i32 2, i32 31) %tmp_7 = zext i30 %A1 to i64 %gmem_addr_2 = getelementptr i32* %gmem, i64 %tmp_7 call void (...)* @_ssdm_op_SpecBitsMap(i32* %gmem), !map !11 call void (...)* @_ssdm_op_SpecTopModule([12 x i8]* @matrix_mult_str) nounwind %tempA_0 = alloca [32 x i32], align 4 %tempA_1 = alloca [32 x i32], align 4 %tempB_0 = alloca [32 x i32], align 4 %tempB_1 = alloca [32 x i32], align 4 %tempResult_0 = alloca [32 x i32], align 4 %tempResult_1 = alloca [32 x i32], align 4 call void (...)* @_ssdm_op_SpecInterface(i32 %result, [10 x i8]* @mode5, i32 0, i32 0, [1 x i8]* @p_str1, i32 0, i32 32, [1 x i8]* @bundle6, [6 x i8]* @p_str2, [1 x i8]* @p_str1, i32 16, i32 16, i32 16, i32 16, [1 x i8]* @p_str1, [1 x i8]* @p_str1) call void (...)* @_ssdm_op_SpecInterface(i32 %B, [10 x i8]* @mode3, i32 0, i32 0, [1 x i8]* @p_str1, i32 0, i32 32, [1 x i8]* @bundle4, [6 x i8]* @p_str2, [1 x i8]* @p_str1, i32 16, i32 16, i32 16, i32 16, [1 x i8]* @p_str1, [1 x i8]* @p_str1) call void (...)* @_ssdm_op_SpecInterface(i32* %gmem, [6 x i8]* @p_str, i32 0, i32 0, [1 x i8]* @p_str1, i32 0, i32 32, [1 x i8]* @p_str1, [6 x i8]* @p_str2, [1 x i8]* @p_str1, i32 16, i32 16, i32 16, i32 16, [1 x i8]* @p_str1, [1 x i8]* @p_str1) call void (...)* @_ssdm_op_SpecInterface(i32 %A, [10 x i8]* @mode, i32 0, i32 0, [1 x i8]* @p_str1, i32 0, i32 32, [1 x i8]* @bundle, [6 x i8]* @p_str2, [1 x i8]* @p_str1, i32 16, i32 16, i32 16, i32 16, [1 x i8]* @p_str1, [1 x i8]* @p_str1) call void (...)* @_ssdm_op_SpecInterface(i32 0, [10 x i8]* @p_str3, i32 0, i32 0, [1 x i8]* @p_str1, i32 0, i32 0, [1 x i8]* @p_str1, [1 x i8]* @p_str1, [1 x i8]* 
@p_str1, i32 0, i32 0, i32 0, i32 0, [1 x i8]* @p_str1, [1 x i8]* @p_str1) nounwind %gmem_addr_2_rd_req = call i1 @_ssdm_op_ReadReq.m_axi.i32P(i32* %gmem_addr_2, i32 64) br label %burst.rd.header burst.rd.header: ; preds = %burst.rd.body506, %0 %indvar = phi i7 [ 0, %0 ], [ %indvar_next, %burst.rd.body506 ] %exitcond3 = icmp eq i7 %indvar, -64 %indvar_next = add i7 %indvar, 1 br i1 %exitcond3, label %burst.rd.header7.preheader, label %burst.rd.body burst.rd.header7.preheader: ; preds = %burst.rd.header %gmem_addr_1_rd_req = call i1 @_ssdm_op_ReadReq.m_axi.i32P(i32* %gmem_addr_1, i32 64) br label %burst.rd.header7 burst.rd.body: ; preds = %burst.rd.header %empty = call i32 (...)* @_ssdm_op_SpecLoopTripCount(i64 64, i64 64, i64 64) nounwind %burstread_rbegin = call i32 (...)* @_ssdm_op_SpecRegionBegin([17 x i8]* @burstread_OC_region_s) nounwind call void (...)* @_ssdm_op_SpecPipeline(i32 1, i32 1, i32 1, i32 0, [1 x i8]* @p_str8) call void (...)* @_ssdm_op_SpecLoopName([15 x i8]* @memcpy_OC_tempA_OC_A) %gmem_addr_2_read = call i32 @_ssdm_op_Read.m_axi.i32P(i32* %gmem_addr_2) %tmp = trunc i7 %indvar to i1 %newIndex = call i6 @_ssdm_op_PartSelect.i6.i7.i32.i32(i7 %indvar, i32 1, i32 6) %newIndex1 = zext i6 %newIndex to i64 %tempA_0_addr = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex1 %tempA_1_addr = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex1 br i1 %tmp, label %branch5, label %branch4 burst.rd.body506: ; preds = %branch5, %branch4 %burstread_rend = call i32 (...)* @_ssdm_op_SpecRegionEnd([17 x i8]* @burstread_OC_region_s, i32 %burstread_rbegin) nounwind br label %burst.rd.header burst.rd.header7: ; preds = %burst.rd.header7.preheader, %burst.rd.body8420 %indvar9 = phi i7 [ %indvar_next1, %burst.rd.body8420 ], [ 0, %burst.rd.header7.preheader ] %exitcond4 = icmp eq i7 %indvar9, -64 %indvar_next1 = add i7 %indvar9, 1 br i1 %exitcond4, label %burst.rd.end6.0.preheader, label %burst.rd.body8 burst.rd.end6.0.preheader: ; preds = %burst.rd.header7 
%tempB_0_addr_1 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 0 %tempB_0_load = load i32* %tempB_0_addr_1, align 16 %tempB_0_addr_2 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 4 %tempB_0_load_1 = load i32* %tempB_0_addr_2, align 16 %tempB_0_addr_3 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 8 %tempB_0_load_2 = load i32* %tempB_0_addr_3, align 16 %tempB_0_addr_4 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 12 %tempB_0_load_3 = load i32* %tempB_0_addr_4, align 16 %tempB_0_addr_5 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 16 %tempB_0_load_4 = load i32* %tempB_0_addr_5, align 16 %tempB_0_addr_6 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 20 %tempB_0_load_5 = load i32* %tempB_0_addr_6, align 16 %tempB_0_addr_7 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 24 %tempB_0_load_6 = load i32* %tempB_0_addr_7, align 16 %tempB_0_addr_8 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 28 %tempB_0_load_7 = load i32* %tempB_0_addr_8, align 16 %tempB_1_addr_1 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 0 %tempB_1_load = load i32* %tempB_1_addr_1, align 4 %tempB_1_addr_2 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 4 %tempB_1_load_1 = load i32* %tempB_1_addr_2, align 4 %tempB_1_addr_3 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 8 %tempB_1_load_2 = load i32* %tempB_1_addr_3, align 4 %tempB_1_addr_4 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 12 %tempB_1_load_3 = load i32* %tempB_1_addr_4, align 4 %tempB_1_addr_5 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 16 %tempB_1_load_4 = load i32* %tempB_1_addr_5, align 4 %tempB_1_addr_6 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 20 %tempB_1_load_5 = load i32* %tempB_1_addr_6, align 4 %tempB_1_addr_7 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 24 %tempB_1_load_6 = load i32* %tempB_1_addr_7, align 4 %tempB_1_addr_8 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 28 %tempB_1_load_7 = load i32* %tempB_1_addr_8, align 4 %tempB_0_addr_9 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 
1 %tempB_0_load_8 = load i32* %tempB_0_addr_9, align 8 %tempB_0_addr_10 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 5 %tempB_0_load_9 = load i32* %tempB_0_addr_10, align 8 %tempB_0_addr_11 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 9 %tempB_0_load_10 = load i32* %tempB_0_addr_11, align 8 %tempB_0_addr_12 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 13 %tempB_0_load_11 = load i32* %tempB_0_addr_12, align 8 %tempB_0_addr_13 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 17 %tempB_0_load_12 = load i32* %tempB_0_addr_13, align 8 %tempB_0_addr_14 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 21 %tempB_0_load_13 = load i32* %tempB_0_addr_14, align 8 %tempB_0_addr_15 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 25 %tempB_0_load_14 = load i32* %tempB_0_addr_15, align 8 %tempB_0_addr_16 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 29 %tempB_0_load_15 = load i32* %tempB_0_addr_16, align 8 %tempB_1_addr_9 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 1 %tempB_1_load_8 = load i32* %tempB_1_addr_9, align 4 %tempB_1_addr_10 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 5 %tempB_1_load_9 = load i32* %tempB_1_addr_10, align 4 %tempB_1_addr_11 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 9 %tempB_1_load_10 = load i32* %tempB_1_addr_11, align 4 %tempB_1_addr_12 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 13 %tempB_1_load_11 = load i32* %tempB_1_addr_12, align 4 %tempB_1_addr_13 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 17 %tempB_1_load_12 = load i32* %tempB_1_addr_13, align 4 %tempB_1_addr_14 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 21 %tempB_1_load_13 = load i32* %tempB_1_addr_14, align 4 %tempB_1_addr_15 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 25 %tempB_1_load_14 = load i32* %tempB_1_addr_15, align 4 %tempB_1_addr_16 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 29 %tempB_1_load_15 = load i32* %tempB_1_addr_16, align 4 %tempB_0_addr_17 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 2 %tempB_0_load_16 = load 
i32* %tempB_0_addr_17, align 16 %tempB_0_addr_18 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 6 %tempB_0_load_17 = load i32* %tempB_0_addr_18, align 16 %tempB_0_addr_19 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 10 %tempB_0_load_18 = load i32* %tempB_0_addr_19, align 16 %tempB_0_addr_20 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 14 %tempB_0_load_19 = load i32* %tempB_0_addr_20, align 16 %tempB_0_addr_21 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 18 %tempB_0_load_20 = load i32* %tempB_0_addr_21, align 16 %tempB_0_addr_22 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 22 %tempB_0_load_21 = load i32* %tempB_0_addr_22, align 16 %tempB_0_addr_23 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 26 %tempB_0_load_22 = load i32* %tempB_0_addr_23, align 16 %tempB_0_addr_24 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 30 %tempB_0_load_23 = load i32* %tempB_0_addr_24, align 16 %tempB_1_addr_17 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 2 %tempB_1_load_16 = load i32* %tempB_1_addr_17, align 4 %tempB_1_addr_18 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 6 %tempB_1_load_17 = load i32* %tempB_1_addr_18, align 4 %tempB_1_addr_19 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 10 %tempB_1_load_18 = load i32* %tempB_1_addr_19, align 4 %tempB_1_addr_20 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 14 %tempB_1_load_19 = load i32* %tempB_1_addr_20, align 4 %tempB_1_addr_21 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 18 %tempB_1_load_20 = load i32* %tempB_1_addr_21, align 4 %tempB_1_addr_22 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 22 %tempB_1_load_21 = load i32* %tempB_1_addr_22, align 4 %tempB_1_addr_23 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 26 %tempB_1_load_22 = load i32* %tempB_1_addr_23, align 4 %tempB_1_addr_24 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 30 %tempB_1_load_23 = load i32* %tempB_1_addr_24, align 4 %tempB_0_addr_25 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 3 %tempB_0_load_24 = load i32* 
%tempB_0_addr_25, align 8 %tempB_0_addr_26 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 7 %tempB_0_load_25 = load i32* %tempB_0_addr_26, align 8 %tempB_0_addr_27 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 11 %tempB_0_load_26 = load i32* %tempB_0_addr_27, align 8 %tempB_0_addr_28 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 15 %tempB_0_load_27 = load i32* %tempB_0_addr_28, align 8 %tempB_0_addr_29 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 19 %tempB_0_load_28 = load i32* %tempB_0_addr_29, align 8 %tempB_0_addr_30 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 23 %tempB_0_load_29 = load i32* %tempB_0_addr_30, align 8 %tempB_0_addr_31 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 27 %tempB_0_load_30 = load i32* %tempB_0_addr_31, align 8 %tempB_0_addr_32 = getelementptr [32 x i32]* %tempB_0, i64 0, i64 31 %tempB_0_load_31 = load i32* %tempB_0_addr_32, align 8 %tempB_1_addr_25 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 3 %tempB_1_load_24 = load i32* %tempB_1_addr_25, align 4 %tempB_1_addr_26 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 7 %tempB_1_load_25 = load i32* %tempB_1_addr_26, align 4 %tempB_1_addr_27 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 11 %tempB_1_load_26 = load i32* %tempB_1_addr_27, align 4 %tempB_1_addr_28 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 15 %tempB_1_load_27 = load i32* %tempB_1_addr_28, align 4 %tempB_1_addr_29 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 19 %tempB_1_load_28 = load i32* %tempB_1_addr_29, align 4 %tempB_1_addr_30 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 23 %tempB_1_load_29 = load i32* %tempB_1_addr_30, align 4 %tempB_1_addr_31 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 27 %tempB_1_load_30 = load i32* %tempB_1_addr_31, align 4 %tempB_1_addr_32 = getelementptr [32 x i32]* %tempB_1, i64 0, i64 31 %tempB_1_load_31 = load i32* %tempB_1_addr_32, align 4 br label %burst.rd.end6.0 burst.rd.body8: ; preds = %burst.rd.header7 %empty_7 = call i32 (...)* 
@_ssdm_op_SpecLoopTripCount(i64 64, i64 64, i64 64) nounwind %burstread_rbegin1 = call i32 (...)* @_ssdm_op_SpecRegionBegin([17 x i8]* @burstread_OC_region_s) nounwind call void (...)* @_ssdm_op_SpecPipeline(i32 1, i32 1, i32 1, i32 0, [1 x i8]* @p_str9) call void (...)* @_ssdm_op_SpecLoopName([15 x i8]* @memcpy_OC_tempB_OC_B) %gmem_addr_1_read = call i32 @_ssdm_op_Read.m_axi.i32P(i32* %gmem_addr_1) %tmp_1 = trunc i7 %indvar9 to i1 %newIndex2 = call i6 @_ssdm_op_PartSelect.i6.i7.i32.i32(i7 %indvar9, i32 1, i32 6) %newIndex3 = zext i6 %newIndex2 to i64 %tempB_0_addr = getelementptr [32 x i32]* %tempB_0, i64 0, i64 %newIndex3 %tempB_1_addr = getelementptr [32 x i32]* %tempB_1, i64 0, i64 %newIndex3 br i1 %tmp_1, label %branch3, label %branch2 burst.rd.body8420: ; preds = %branch3, %branch2 %burstread_rend14 = call i32 (...)* @_ssdm_op_SpecRegionEnd([17 x i8]* @burstread_OC_region_s, i32 %burstread_rbegin1) nounwind br label %burst.rd.header7 burst.rd.end6.0: ; preds = %burst.rd.end6.1, %burst.rd.end6.0.preheader %i = phi i4 [ %i_1_1, %burst.rd.end6.1 ], [ 0, %burst.rd.end6.0.preheader ] %exitcond2 = icmp eq i4 %i, -8 br i1 %exitcond2, label %burst.wr.header.preheader, label %burst.rd.end6.1 burst.wr.header.preheader: ; preds = %burst.rd.end6.0 %gmem_addr_wr_req = call i1 @_ssdm_op_WriteReq.m_axi.i32P(i32* %gmem_addr, i32 64) br label %burst.wr.header burst.rd.end6.1: ; preds = %burst.rd.end6.0 %empty_8 = call i32 (...)* @_ssdm_op_SpecLoopTripCount(i64 4, i64 4, i64 4) nounwind call void (...)* @_ssdm_op_SpecLoopName([24 x i8]* @p_str5) nounwind %tmp_2 = call i32 (...)* @_ssdm_op_SpecRegionBegin([24 x i8]* @p_str5) nounwind call void (...)* @_ssdm_op_SpecPipeline(i32 -1, i32 1, i32 1, i32 0, [1 x i8]* @p_str1) nounwind %tmp_3 = trunc i4 %i to i3 %tmp_4 = call i5 @_ssdm_op_BitConcatenate.i5.i3.i2(i3 %tmp_3, i2 0) %newIndex5 = zext i5 %tmp_4 to i64 %tempResult_0_addr = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex5 %tempA_0_addr_1 = getelementptr [32 x 
i32]* %tempA_0, i64 0, i64 %newIndex5 %tempA_0_load = load i32* %tempA_0_addr_1, align 16 %tmp_s = mul nsw i32 %tempB_0_load, %tempA_0_load %tempA_1_addr_1 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex5 %tempA_1_load = load i32* %tempA_1_addr_1, align 4 %tmp_10_0_0_1 = mul nsw i32 %tempB_0_load_1, %tempA_1_load %newIndex6 = or i5 %tmp_4, 1 %newIndex7 = zext i5 %newIndex6 to i64 %tempA_0_addr_2 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex7 %tempA_0_load_1 = load i32* %tempA_0_addr_2, align 8 %tmp_10_0_0_2 = mul nsw i32 %tempB_0_load_2, %tempA_0_load_1 %tempA_1_addr_2 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex7 %tempA_1_load_1 = load i32* %tempA_1_addr_2, align 4 %tmp_10_0_0_3 = mul nsw i32 %tempB_0_load_3, %tempA_1_load_1 %newIndex8 = or i5 %tmp_4, 2 %newIndex9 = zext i5 %newIndex8 to i64 %tempA_0_addr_3 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex9 %tempA_0_load_2 = load i32* %tempA_0_addr_3, align 16 %tmp_10_0_0_4 = mul nsw i32 %tempB_0_load_4, %tempA_0_load_2 %tempA_1_addr_3 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex9 %tempA_1_load_2 = load i32* %tempA_1_addr_3, align 4 %tmp_10_0_0_5 = mul nsw i32 %tempB_0_load_5, %tempA_1_load_2 %newIndex4 = or i5 %tmp_4, 3 %newIndex10 = zext i5 %newIndex4 to i64 %tempA_0_addr_4 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex10 %tempA_0_load_3 = load i32* %tempA_0_addr_4, align 8 %tmp_10_0_0_6 = mul nsw i32 %tempB_0_load_6, %tempA_0_load_3 %tempA_1_addr_4 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex10 %tempA_1_load_3 = load i32* %tempA_1_addr_4, align 4 %tmp_10_0_0_7 = mul nsw i32 %tempB_0_load_7, %tempA_1_load_3 %tmp2 = add i32 %tmp_s, %tmp_10_0_0_1 %tmp3 = add i32 %tmp_10_0_0_3, %tmp_10_0_0_2 %tmp1 = add i32 %tmp2, %tmp3 %tmp5 = add i32 %tmp_10_0_0_5, %tmp_10_0_0_4 %tmp6 = add i32 %tmp_10_0_0_7, %tmp_10_0_0_6 %tmp4 = add i32 %tmp5, %tmp6 %tmp_11_0_0_7 = add nsw i32 %tmp1, %tmp4 store i32 %tmp_11_0_0_7, i32* %tempResult_0_addr, 
align 16 %tempResult_1_addr = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex5 %tmp_10_0_1 = mul nsw i32 %tempB_1_load, %tempA_0_load %tmp_10_0_1_1 = mul nsw i32 %tempB_1_load_1, %tempA_1_load %tmp_10_0_1_2 = mul nsw i32 %tempB_1_load_2, %tempA_0_load_1 %tmp_10_0_1_3 = mul nsw i32 %tempB_1_load_3, %tempA_1_load_1 %tmp_10_0_1_4 = mul nsw i32 %tempB_1_load_4, %tempA_0_load_2 %tmp_10_0_1_5 = mul nsw i32 %tempB_1_load_5, %tempA_1_load_2 %tmp_10_0_1_6 = mul nsw i32 %tempB_1_load_6, %tempA_0_load_3 %tmp_10_0_1_7 = mul nsw i32 %tempB_1_load_7, %tempA_1_load_3 %tmp8 = add i32 %tmp_10_0_1, %tmp_10_0_1_1 %tmp9 = add i32 %tmp_10_0_1_3, %tmp_10_0_1_2 %tmp7 = add i32 %tmp8, %tmp9 %tmp11 = add i32 %tmp_10_0_1_5, %tmp_10_0_1_4 %tmp12 = add i32 %tmp_10_0_1_7, %tmp_10_0_1_6 %tmp10 = add i32 %tmp11, %tmp12 %tmp_11_0_1_7 = add nsw i32 %tmp7, %tmp10 store i32 %tmp_11_0_1_7, i32* %tempResult_1_addr, align 4 %tempResult_0_addr_1 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex7 %tmp_10_0_2 = mul nsw i32 %tempB_0_load_8, %tempA_0_load %tmp_10_0_2_1 = mul nsw i32 %tempB_0_load_9, %tempA_1_load %tmp_10_0_2_2 = mul nsw i32 %tempB_0_load_10, %tempA_0_load_1 %tmp_10_0_2_3 = mul nsw i32 %tempB_0_load_11, %tempA_1_load_1 %tmp_10_0_2_4 = mul nsw i32 %tempB_0_load_12, %tempA_0_load_2 %tmp_10_0_2_5 = mul nsw i32 %tempB_0_load_13, %tempA_1_load_2 %tmp_10_0_2_6 = mul nsw i32 %tempB_0_load_14, %tempA_0_load_3 %tmp_10_0_2_7 = mul nsw i32 %tempB_0_load_15, %tempA_1_load_3 %tmp14 = add i32 %tmp_10_0_2, %tmp_10_0_2_1 %tmp15 = add i32 %tmp_10_0_2_3, %tmp_10_0_2_2 %tmp13 = add i32 %tmp14, %tmp15 %tmp17 = add i32 %tmp_10_0_2_5, %tmp_10_0_2_4 %tmp18 = add i32 %tmp_10_0_2_7, %tmp_10_0_2_6 %tmp16 = add i32 %tmp17, %tmp18 %tmp_11_0_2_7 = add nsw i32 %tmp13, %tmp16 store i32 %tmp_11_0_2_7, i32* %tempResult_0_addr_1, align 8 %tempResult_1_addr_1 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex7 %tmp_10_0_3 = mul nsw i32 %tempB_1_load_8, %tempA_0_load %tmp_10_0_3_1 = mul 
nsw i32 %tempB_1_load_9, %tempA_1_load %tmp_10_0_3_2 = mul nsw i32 %tempB_1_load_10, %tempA_0_load_1 %tmp_10_0_3_3 = mul nsw i32 %tempB_1_load_11, %tempA_1_load_1 %tmp_10_0_3_4 = mul nsw i32 %tempB_1_load_12, %tempA_0_load_2 %tmp_10_0_3_5 = mul nsw i32 %tempB_1_load_13, %tempA_1_load_2 %tmp_10_0_3_6 = mul nsw i32 %tempB_1_load_14, %tempA_0_load_3 %tmp_10_0_3_7 = mul nsw i32 %tempB_1_load_15, %tempA_1_load_3 %tmp20 = add i32 %tmp_10_0_3, %tmp_10_0_3_1 %tmp21 = add i32 %tmp_10_0_3_3, %tmp_10_0_3_2 %tmp19 = add i32 %tmp20, %tmp21 %tmp23 = add i32 %tmp_10_0_3_5, %tmp_10_0_3_4 %tmp24 = add i32 %tmp_10_0_3_7, %tmp_10_0_3_6 %tmp22 = add i32 %tmp23, %tmp24 %tmp_11_0_3_7 = add nsw i32 %tmp19, %tmp22 store i32 %tmp_11_0_3_7, i32* %tempResult_1_addr_1, align 4 %tempResult_0_addr_2 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex9 %tmp_10_0_4 = mul nsw i32 %tempB_0_load_16, %tempA_0_load %tmp_10_0_4_1 = mul nsw i32 %tempB_0_load_17, %tempA_1_load %tmp_10_0_4_2 = mul nsw i32 %tempB_0_load_18, %tempA_0_load_1 %tmp_10_0_4_3 = mul nsw i32 %tempB_0_load_19, %tempA_1_load_1 %tmp_10_0_4_4 = mul nsw i32 %tempB_0_load_20, %tempA_0_load_2 %tmp_10_0_4_5 = mul nsw i32 %tempB_0_load_21, %tempA_1_load_2 %tmp_10_0_4_6 = mul nsw i32 %tempB_0_load_22, %tempA_0_load_3 %tmp_10_0_4_7 = mul nsw i32 %tempB_0_load_23, %tempA_1_load_3 %tmp26 = add i32 %tmp_10_0_4, %tmp_10_0_4_1 %tmp27 = add i32 %tmp_10_0_4_3, %tmp_10_0_4_2 %tmp25 = add i32 %tmp26, %tmp27 %tmp29 = add i32 %tmp_10_0_4_5, %tmp_10_0_4_4 %tmp30 = add i32 %tmp_10_0_4_7, %tmp_10_0_4_6 %tmp28 = add i32 %tmp29, %tmp30 %tmp_11_0_4_7 = add nsw i32 %tmp25, %tmp28 store i32 %tmp_11_0_4_7, i32* %tempResult_0_addr_2, align 16 %tempResult_1_addr_2 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex9 %tmp_10_0_5 = mul nsw i32 %tempB_1_load_16, %tempA_0_load %tmp_10_0_5_1 = mul nsw i32 %tempB_1_load_17, %tempA_1_load %tmp_10_0_5_2 = mul nsw i32 %tempB_1_load_18, %tempA_0_load_1 %tmp_10_0_5_3 = mul nsw i32 %tempB_1_load_19, 
%tempA_1_load_1 %tmp_10_0_5_4 = mul nsw i32 %tempB_1_load_20, %tempA_0_load_2 %tmp_10_0_5_5 = mul nsw i32 %tempB_1_load_21, %tempA_1_load_2 %tmp_10_0_5_6 = mul nsw i32 %tempB_1_load_22, %tempA_0_load_3 %tmp_10_0_5_7 = mul nsw i32 %tempB_1_load_23, %tempA_1_load_3 %tmp32 = add i32 %tmp_10_0_5, %tmp_10_0_5_1 %tmp33 = add i32 %tmp_10_0_5_3, %tmp_10_0_5_2 %tmp31 = add i32 %tmp32, %tmp33 %tmp35 = add i32 %tmp_10_0_5_5, %tmp_10_0_5_4 %tmp36 = add i32 %tmp_10_0_5_7, %tmp_10_0_5_6 %tmp34 = add i32 %tmp35, %tmp36 %tmp_11_0_5_7 = add nsw i32 %tmp31, %tmp34 store i32 %tmp_11_0_5_7, i32* %tempResult_1_addr_2, align 4 %tempResult_0_addr_3 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex10 %tmp_10_0_6 = mul nsw i32 %tempB_0_load_24, %tempA_0_load %tmp_10_0_6_1 = mul nsw i32 %tempB_0_load_25, %tempA_1_load %tmp_10_0_6_2 = mul nsw i32 %tempB_0_load_26, %tempA_0_load_1 %tmp_10_0_6_3 = mul nsw i32 %tempB_0_load_27, %tempA_1_load_1 %tmp_10_0_6_4 = mul nsw i32 %tempB_0_load_28, %tempA_0_load_2 %tmp_10_0_6_5 = mul nsw i32 %tempB_0_load_29, %tempA_1_load_2 %tmp_10_0_6_6 = mul nsw i32 %tempB_0_load_30, %tempA_0_load_3 %tmp_10_0_6_7 = mul nsw i32 %tempB_0_load_31, %tempA_1_load_3 %tmp38 = add i32 %tmp_10_0_6, %tmp_10_0_6_1 %tmp39 = add i32 %tmp_10_0_6_3, %tmp_10_0_6_2 %tmp37 = add i32 %tmp38, %tmp39 %tmp41 = add i32 %tmp_10_0_6_5, %tmp_10_0_6_4 %tmp42 = add i32 %tmp_10_0_6_7, %tmp_10_0_6_6 %tmp40 = add i32 %tmp41, %tmp42 %tmp_11_0_6_7 = add nsw i32 %tmp37, %tmp40 store i32 %tmp_11_0_6_7, i32* %tempResult_0_addr_3, align 8 %tempResult_1_addr_3 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex10 %tmp_10_0_7 = mul nsw i32 %tempB_1_load_24, %tempA_0_load %tmp_10_0_7_1 = mul nsw i32 %tempB_1_load_25, %tempA_1_load %tmp_10_0_7_2 = mul nsw i32 %tempB_1_load_26, %tempA_0_load_1 %tmp_10_0_7_3 = mul nsw i32 %tempB_1_load_27, %tempA_1_load_1 %tmp_10_0_7_4 = mul nsw i32 %tempB_1_load_28, %tempA_0_load_2 %tmp_10_0_7_5 = mul nsw i32 %tempB_1_load_29, %tempA_1_load_2 
%tmp_10_0_7_6 = mul nsw i32 %tempB_1_load_30, %tempA_0_load_3 %tmp_10_0_7_7 = mul nsw i32 %tempB_1_load_31, %tempA_1_load_3 %tmp44 = add i32 %tmp_10_0_7, %tmp_10_0_7_1 %tmp45 = add i32 %tmp_10_0_7_3, %tmp_10_0_7_2 %tmp43 = add i32 %tmp44, %tmp45 %tmp47 = add i32 %tmp_10_0_7_5, %tmp_10_0_7_4 %tmp48 = add i32 %tmp_10_0_7_7, %tmp_10_0_7_6 %tmp46 = add i32 %tmp47, %tmp48 %tmp_11_0_7_7 = add nsw i32 %tmp43, %tmp46 store i32 %tmp_11_0_7_7, i32* %tempResult_1_addr_3, align 4 %empty_9 = call i32 (...)* @_ssdm_op_SpecRegionEnd([24 x i8]* @p_str5, i32 %tmp_2) nounwind %newIndex11 = or i5 %tmp_4, 4 %newIndex12 = zext i5 %newIndex11 to i64 %tempResult_0_addr_4 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex12 %tempA_0_addr_5 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex12 %tempA_0_load_4 = load i32* %tempA_0_addr_5, align 16 %tmp_10_1 = mul nsw i32 %tempB_0_load, %tempA_0_load_4 %tempA_1_addr_5 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex12 %tempA_1_load_4 = load i32* %tempA_1_addr_5, align 4 %tmp_10_1_0_1 = mul nsw i32 %tempB_0_load_1, %tempA_1_load_4 %newIndex13 = or i5 %tmp_4, 5 %newIndex14 = zext i5 %newIndex13 to i64 %tempA_0_addr_6 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex14 %tempA_0_load_5 = load i32* %tempA_0_addr_6, align 8 %tmp_10_1_0_2 = mul nsw i32 %tempB_0_load_2, %tempA_0_load_5 %tempA_1_addr_6 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex14 %tempA_1_load_5 = load i32* %tempA_1_addr_6, align 4 %tmp_10_1_0_3 = mul nsw i32 %tempB_0_load_3, %tempA_1_load_5 %newIndex15 = or i5 %tmp_4, 6 %newIndex16 = zext i5 %newIndex15 to i64 %tempA_0_addr_7 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex16 %tempA_0_load_6 = load i32* %tempA_0_addr_7, align 16 %tmp_10_1_0_4 = mul nsw i32 %tempB_0_load_4, %tempA_0_load_6 %tempA_1_addr_7 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex16 %tempA_1_load_6 = load i32* %tempA_1_addr_7, align 4 %tmp_10_1_0_5 = mul nsw i32 %tempB_0_load_5, 
%tempA_1_load_6 %newIndex17 = or i5 %tmp_4, 7 %newIndex18 = zext i5 %newIndex17 to i64 %tempA_0_addr_8 = getelementptr [32 x i32]* %tempA_0, i64 0, i64 %newIndex18 %tempA_0_load_7 = load i32* %tempA_0_addr_8, align 8 %tmp_10_1_0_6 = mul nsw i32 %tempB_0_load_6, %tempA_0_load_7 %tempA_1_addr_8 = getelementptr [32 x i32]* %tempA_1, i64 0, i64 %newIndex18 %tempA_1_load_7 = load i32* %tempA_1_addr_8, align 4 %tmp_10_1_0_7 = mul nsw i32 %tempB_0_load_7, %tempA_1_load_7 %tmp50 = add i32 %tmp_10_1, %tmp_10_1_0_1 %tmp51 = add i32 %tmp_10_1_0_3, %tmp_10_1_0_2 %tmp49 = add i32 %tmp50, %tmp51 %tmp53 = add i32 %tmp_10_1_0_5, %tmp_10_1_0_4 %tmp54 = add i32 %tmp_10_1_0_7, %tmp_10_1_0_6 %tmp52 = add i32 %tmp53, %tmp54 %tmp_11_1_0_7 = add nsw i32 %tmp49, %tmp52 store i32 %tmp_11_1_0_7, i32* %tempResult_0_addr_4, align 16 %tempResult_1_addr_4 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex12 %tmp_10_1_1 = mul nsw i32 %tempB_1_load, %tempA_0_load_4 %tmp_10_1_1_1 = mul nsw i32 %tempB_1_load_1, %tempA_1_load_4 %tmp_10_1_1_2 = mul nsw i32 %tempB_1_load_2, %tempA_0_load_5 %tmp_10_1_1_3 = mul nsw i32 %tempB_1_load_3, %tempA_1_load_5 %tmp_10_1_1_4 = mul nsw i32 %tempB_1_load_4, %tempA_0_load_6 %tmp_10_1_1_5 = mul nsw i32 %tempB_1_load_5, %tempA_1_load_6 %tmp_10_1_1_6 = mul nsw i32 %tempB_1_load_6, %tempA_0_load_7 %tmp_10_1_1_7 = mul nsw i32 %tempB_1_load_7, %tempA_1_load_7 %tmp56 = add i32 %tmp_10_1_1, %tmp_10_1_1_1 %tmp57 = add i32 %tmp_10_1_1_3, %tmp_10_1_1_2 %tmp55 = add i32 %tmp56, %tmp57 %tmp59 = add i32 %tmp_10_1_1_5, %tmp_10_1_1_4 %tmp60 = add i32 %tmp_10_1_1_7, %tmp_10_1_1_6 %tmp58 = add i32 %tmp59, %tmp60 %tmp_11_1_1_7 = add nsw i32 %tmp55, %tmp58 store i32 %tmp_11_1_1_7, i32* %tempResult_1_addr_4, align 4 %tempResult_0_addr_5 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex14 %tmp_10_1_2 = mul nsw i32 %tempB_0_load_8, %tempA_0_load_4 %tmp_10_1_2_1 = mul nsw i32 %tempB_0_load_9, %tempA_1_load_4 %tmp_10_1_2_2 = mul nsw i32 %tempB_0_load_10, 
%tempA_0_load_5 %tmp_10_1_2_3 = mul nsw i32 %tempB_0_load_11, %tempA_1_load_5 %tmp_10_1_2_4 = mul nsw i32 %tempB_0_load_12, %tempA_0_load_6 %tmp_10_1_2_5 = mul nsw i32 %tempB_0_load_13, %tempA_1_load_6 %tmp_10_1_2_6 = mul nsw i32 %tempB_0_load_14, %tempA_0_load_7 %tmp_10_1_2_7 = mul nsw i32 %tempB_0_load_15, %tempA_1_load_7 %tmp62 = add i32 %tmp_10_1_2, %tmp_10_1_2_1 %tmp63 = add i32 %tmp_10_1_2_3, %tmp_10_1_2_2 %tmp61 = add i32 %tmp62, %tmp63 %tmp65 = add i32 %tmp_10_1_2_5, %tmp_10_1_2_4 %tmp66 = add i32 %tmp_10_1_2_7, %tmp_10_1_2_6 %tmp64 = add i32 %tmp65, %tmp66 %tmp_11_1_2_7 = add nsw i32 %tmp61, %tmp64 store i32 %tmp_11_1_2_7, i32* %tempResult_0_addr_5, align 8 %tempResult_1_addr_5 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex14 %tmp_10_1_3 = mul nsw i32 %tempB_1_load_8, %tempA_0_load_4 %tmp_10_1_3_1 = mul nsw i32 %tempB_1_load_9, %tempA_1_load_4 %tmp_10_1_3_2 = mul nsw i32 %tempB_1_load_10, %tempA_0_load_5 %tmp_10_1_3_3 = mul nsw i32 %tempB_1_load_11, %tempA_1_load_5 %tmp_10_1_3_4 = mul nsw i32 %tempB_1_load_12, %tempA_0_load_6 %tmp_10_1_3_5 = mul nsw i32 %tempB_1_load_13, %tempA_1_load_6 %tmp_10_1_3_6 = mul nsw i32 %tempB_1_load_14, %tempA_0_load_7 %tmp_10_1_3_7 = mul nsw i32 %tempB_1_load_15, %tempA_1_load_7 %tmp68 = add i32 %tmp_10_1_3, %tmp_10_1_3_1 %tmp69 = add i32 %tmp_10_1_3_3, %tmp_10_1_3_2 %tmp67 = add i32 %tmp68, %tmp69 %tmp71 = add i32 %tmp_10_1_3_5, %tmp_10_1_3_4 %tmp72 = add i32 %tmp_10_1_3_7, %tmp_10_1_3_6 %tmp70 = add i32 %tmp71, %tmp72 %tmp_11_1_3_7 = add nsw i32 %tmp67, %tmp70 store i32 %tmp_11_1_3_7, i32* %tempResult_1_addr_5, align 4 %tempResult_0_addr_6 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex16 %tmp_10_1_4 = mul nsw i32 %tempB_0_load_16, %tempA_0_load_4 %tmp_10_1_4_1 = mul nsw i32 %tempB_0_load_17, %tempA_1_load_4 %tmp_10_1_4_2 = mul nsw i32 %tempB_0_load_18, %tempA_0_load_5 %tmp_10_1_4_3 = mul nsw i32 %tempB_0_load_19, %tempA_1_load_5 %tmp_10_1_4_4 = mul nsw i32 %tempB_0_load_20, %tempA_0_load_6 
%tmp_10_1_4_5 = mul nsw i32 %tempB_0_load_21, %tempA_1_load_6 %tmp_10_1_4_6 = mul nsw i32 %tempB_0_load_22, %tempA_0_load_7 %tmp_10_1_4_7 = mul nsw i32 %tempB_0_load_23, %tempA_1_load_7 %tmp74 = add i32 %tmp_10_1_4, %tmp_10_1_4_1 %tmp75 = add i32 %tmp_10_1_4_3, %tmp_10_1_4_2 %tmp73 = add i32 %tmp74, %tmp75 %tmp77 = add i32 %tmp_10_1_4_5, %tmp_10_1_4_4 %tmp78 = add i32 %tmp_10_1_4_7, %tmp_10_1_4_6 %tmp76 = add i32 %tmp77, %tmp78 %tmp_11_1_4_7 = add nsw i32 %tmp73, %tmp76 store i32 %tmp_11_1_4_7, i32* %tempResult_0_addr_6, align 16 %tempResult_1_addr_6 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex16 %tmp_10_1_5 = mul nsw i32 %tempB_1_load_16, %tempA_0_load_4 %tmp_10_1_5_1 = mul nsw i32 %tempB_1_load_17, %tempA_1_load_4 %tmp_10_1_5_2 = mul nsw i32 %tempB_1_load_18, %tempA_0_load_5 %tmp_10_1_5_3 = mul nsw i32 %tempB_1_load_19, %tempA_1_load_5 %tmp_10_1_5_4 = mul nsw i32 %tempB_1_load_20, %tempA_0_load_6 %tmp_10_1_5_5 = mul nsw i32 %tempB_1_load_21, %tempA_1_load_6 %tmp_10_1_5_6 = mul nsw i32 %tempB_1_load_22, %tempA_0_load_7 %tmp_10_1_5_7 = mul nsw i32 %tempB_1_load_23, %tempA_1_load_7 %tmp80 = add i32 %tmp_10_1_5, %tmp_10_1_5_1 %tmp81 = add i32 %tmp_10_1_5_3, %tmp_10_1_5_2 %tmp79 = add i32 %tmp80, %tmp81 %tmp83 = add i32 %tmp_10_1_5_5, %tmp_10_1_5_4 %tmp84 = add i32 %tmp_10_1_5_7, %tmp_10_1_5_6 %tmp82 = add i32 %tmp83, %tmp84 %tmp_11_1_5_7 = add nsw i32 %tmp79, %tmp82 store i32 %tmp_11_1_5_7, i32* %tempResult_1_addr_6, align 4 %tempResult_0_addr_7 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex18 %tmp_10_1_6 = mul nsw i32 %tempB_0_load_24, %tempA_0_load_4 %tmp_10_1_6_1 = mul nsw i32 %tempB_0_load_25, %tempA_1_load_4 %tmp_10_1_6_2 = mul nsw i32 %tempB_0_load_26, %tempA_0_load_5 %tmp_10_1_6_3 = mul nsw i32 %tempB_0_load_27, %tempA_1_load_5 %tmp_10_1_6_4 = mul nsw i32 %tempB_0_load_28, %tempA_0_load_6 %tmp_10_1_6_5 = mul nsw i32 %tempB_0_load_29, %tempA_1_load_6 %tmp_10_1_6_6 = mul nsw i32 %tempB_0_load_30, %tempA_0_load_7 %tmp_10_1_6_7 
= mul nsw i32 %tempB_0_load_31, %tempA_1_load_7 %tmp86 = add i32 %tmp_10_1_6, %tmp_10_1_6_1 %tmp87 = add i32 %tmp_10_1_6_3, %tmp_10_1_6_2 %tmp85 = add i32 %tmp86, %tmp87 %tmp89 = add i32 %tmp_10_1_6_5, %tmp_10_1_6_4 %tmp90 = add i32 %tmp_10_1_6_7, %tmp_10_1_6_6 %tmp88 = add i32 %tmp89, %tmp90 %tmp_11_1_6_7 = add nsw i32 %tmp85, %tmp88 store i32 %tmp_11_1_6_7, i32* %tempResult_0_addr_7, align 8 %tempResult_1_addr_7 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex18 %tmp_10_1_7 = mul nsw i32 %tempB_1_load_24, %tempA_0_load_4 %tmp_10_1_7_1 = mul nsw i32 %tempB_1_load_25, %tempA_1_load_4 %tmp_10_1_7_2 = mul nsw i32 %tempB_1_load_26, %tempA_0_load_5 %tmp_10_1_7_3 = mul nsw i32 %tempB_1_load_27, %tempA_1_load_5 %tmp_10_1_7_4 = mul nsw i32 %tempB_1_load_28, %tempA_0_load_6 %tmp_10_1_7_5 = mul nsw i32 %tempB_1_load_29, %tempA_1_load_6 %tmp_10_1_7_6 = mul nsw i32 %tempB_1_load_30, %tempA_0_load_7 %tmp_10_1_7_7 = mul nsw i32 %tempB_1_load_31, %tempA_1_load_7 %tmp92 = add i32 %tmp_10_1_7, %tmp_10_1_7_1 %tmp93 = add i32 %tmp_10_1_7_3, %tmp_10_1_7_2 %tmp91 = add i32 %tmp92, %tmp93 %tmp95 = add i32 %tmp_10_1_7_5, %tmp_10_1_7_4 %tmp96 = add i32 %tmp_10_1_7_7, %tmp_10_1_7_6 %tmp94 = add i32 %tmp95, %tmp96 %tmp_11_1_7_7 = add nsw i32 %tmp91, %tmp94 store i32 %tmp_11_1_7_7, i32* %tempResult_1_addr_7, align 4 %i_1_1 = add i4 2, %i br label %burst.rd.end6.0 burst.wr.header: ; preds = %burst.wr.header.preheader, %burst.wr.body_ifconv %indvar1 = phi i7 [ %indvar_next2, %burst.wr.body_ifconv ], [ 0, %burst.wr.header.preheader ] %exitcond5 = icmp eq i7 %indvar1, -64 %indvar_next2 = add i7 %indvar1, 1 br i1 %exitcond5, label %memcpy.tail, label %burst.wr.body_ifconv burst.wr.body_ifconv: ; preds = %burst.wr.header %empty_10 = call i32 (...)* @_ssdm_op_SpecLoopTripCount(i64 64, i64 64, i64 64) nounwind %burstwrite_rbegin = call i32 (...)* @_ssdm_op_SpecRegionBegin([18 x i8]* @burstwrite_OC_region) nounwind call void (...)* @_ssdm_op_SpecPipeline(i32 1, i32 1, i32 1, i32 0, [1 
x i8]* @p_str10) call void (...)* @_ssdm_op_SpecLoopName([29 x i8]* @memcpy_OC_result_OC_s) %tmp_97 = trunc i7 %indvar1 to i1 %newIndex19 = call i6 @_ssdm_op_PartSelect.i6.i7.i32.i32(i7 %indvar1, i32 1, i32 6) %newIndex20 = zext i6 %newIndex19 to i64 %tempResult_0_addr_8 = getelementptr [32 x i32]* %tempResult_0, i64 0, i64 %newIndex20 %tempResult_1_addr_8 = getelementptr [32 x i32]* %tempResult_1, i64 0, i64 %newIndex20 %tempResult_1_load = load i32* %tempResult_1_addr_8, align 4 %tempResult_0_load = load i32* %tempResult_0_addr_8, align 4 %tempResult_load_phi = select i1 %tmp_97, i32 %tempResult_1_load, i32 %tempResult_0_load call void @_ssdm_op_Write.m_axi.i32P(i32* %gmem_addr, i32 %tempResult_load_phi, i4 -1) %burstwrite_rend = call i32 (...)* @_ssdm_op_SpecRegionEnd([18 x i8]* @burstwrite_OC_region, i32 %burstwrite_rbegin) nounwind br label %burst.wr.header memcpy.tail: ; preds = %burst.wr.header %gmem_addr_wr_resp = call i1 @_ssdm_op_WriteResp.m_axi.i32P(i32* %gmem_addr) ret void branch2: ; preds = %burst.rd.body8 store i32 %gmem_addr_1_read, i32* %tempB_0_addr, align 4 br label %burst.rd.body8420 branch3: ; preds = %burst.rd.body8 store i32 %gmem_addr_1_read, i32* %tempB_1_addr, align 4 br label %burst.rd.body8420 branch4: ; preds = %burst.rd.body store i32 %gmem_addr_2_read, i32* %tempA_0_addr, align 4 br label %burst.rd.body506 branch5: ; preds = %burst.rd.body store i32 %gmem_addr_2_read, i32* %tempA_1_addr, align 4 br label %burst.rd.body506 } declare i7 @llvm.part.select.i7(i7, i32, i32) nounwind readnone declare i32 @llvm.part.select.i32(i32, i32, i32) nounwind readnone declare void @llvm.dbg.value(metadata, i64, metadata) nounwind readnone declare void @llvm.dbg.declare(metadata, metadata) nounwind readnone define weak i1 @_ssdm_op_WriteResp.m_axi.i32P(i32*) { entry: ret i1 true } define weak i1 @_ssdm_op_WriteReq.m_axi.i32P(i32*, i32) { entry: ret i1 true } define weak void @_ssdm_op_Write.m_axi.i32P(i32*, i32, i4) { entry: ret void } define weak 
void @_ssdm_op_SpecTopModule(...) { ; the `define weak` keywords of this stub are at the end of the previous source line
entry:
  ret void
}

; The variadic _ssdm_op_Spec* definitions below are weak and have trivial
; bodies: the void ones return immediately, the i32 ones return 0.
; NOTE(review): presumably placeholders that the HLS tool interprets as
; directives -- confirm against the tool documentation.
define weak i32 @_ssdm_op_SpecRegionEnd(...) {
entry:
  ret i32 0
}

define weak i32 @_ssdm_op_SpecRegionBegin(...) {
entry:
  ret i32 0
}

define weak void @_ssdm_op_SpecPipeline(...) nounwind {
entry:
  ret void
}

define weak i32 @_ssdm_op_SpecLoopTripCount(...) {
entry:
  ret i32 0
}

define weak void @_ssdm_op_SpecLoopName(...) nounwind {
entry:
  ret void
}

define weak void @_ssdm_op_SpecInterface(...) nounwind {
entry:
  ret void
}

define weak void @_ssdm_op_SpecBitsMap(...) {
entry:
  ret void
}

; Weak stub: ignores both arguments and always returns true.
define weak i1 @_ssdm_op_ReadReq.m_axi.i32P(i32*, i32) {
entry:
  ret i1 true
}

; Weak stub: returns its i32 argument unchanged.
define weak i32 @_ssdm_op_Read.s_axilite.i32(i32) {
entry:
  ret i32 %0
}

; Weak stub: loads one i32 through the pointer argument and returns it.
define weak i32 @_ssdm_op_Read.m_axi.i32P(i32*) {
entry:
  %empty = load i32* %0
  ret i32 %empty
}

; Forwards all three arguments to llvm.part.select.i7 and truncates the i7
; result to i6.
define weak i6 @_ssdm_op_PartSelect.i6.i7.i32.i32(i7, i32, i32) nounwind readnone {
entry:
  %empty = call i7 @llvm.part.select.i7(i7 %0, i32 %1, i32 %2)
  %empty_11 = trunc i7 %empty to i6
  ret i6 %empty_11
}

; Forwards all three arguments to llvm.part.select.i32 and truncates the i32
; result to i30.
define weak i30 @_ssdm_op_PartSelect.i30.i32.i32.i32(i32, i32, i32) nounwind readnone {
entry:
  %empty = call i32 @llvm.part.select.i32(i32 %0, i32 %1, i32 %2)
  %empty_12 = trunc i32 %empty to i30
  ret i30 %empty_12
}

; Declared only; no body is provided for these two variants in this part of
; the file.
declare i3 @_ssdm_op_PartSelect.i3.i4.i32.i32(i4, i32, i32) nounwind readnone

declare i1 @_ssdm_op_PartSelect.i1.i7.i32.i32(i7, i32, i32) nounwind readnone

; Returns the 5-bit value (%0 << 2) | %1: the i3 argument occupies the upper
; three bits and the i2 argument the lower two.
define weak i5 @_ssdm_op_BitConcatenate.i5.i3.i2(i3, i2) nounwind readnone {
entry:
  %empty = zext i3 %0 to i5
  %empty_13 = zext i2 %1 to i5
  %empty_14 = shl i5 %empty, 2
  %empty_15 = or i5 %empty_14, %empty_13
  ret i5 %empty_15
}

; Named metadata. Two of the lists are empty; the others point at the
; numbered nodes defined below.
!opencl.kernels = !{!0}
!hls.encrypted.func = !{}
!llvm.map.gv = !{}
!axi4.master.portmap = !{!7}
!axi4.slave.bundlemap = !{!8, !9, !10}

; !0: kernel record -- a null first operand followed by the attribute nodes
; !1..!6. Each attribute node is a tag string followed by its values.
!0 = metadata !{null, metadata !1, metadata !2, metadata !3, metadata !4, metadata !5, metadata !6}
!1 = metadata !{metadata !"kernel_arg_addr_space", i32 1, i32 1, i32 1}
!2 = metadata !{metadata !"kernel_arg_access_qual", metadata !"none", metadata !"none", metadata !"none"}
!3 = metadata !{metadata !"kernel_arg_type", metadata !"int*", metadata !"int*", metadata !"int*"}
!4 = metadata !{metadata !"kernel_arg_type_qual", metadata !"", metadata !"", metadata !""}
!5 = metadata !{metadata !"kernel_arg_name", metadata !"A", metadata !"B", metadata !"result"}
!6 = metadata !{metadata !"reqd_work_group_size", i32 1, i32 1, i32 1}

; !7 (referenced by !axi4.master.portmap): the string "gmem" followed by
; name / access-string pairs for A, B and result.
!7 = metadata !{metadata !"gmem", metadata !"A", metadata !"READONLY", metadata !"B", metadata !"READONLY", metadata !"result", metadata !"WRITEONLY"}

; !8..!10 (referenced by !axi4.slave.bundlemap): each pairs an argument name
; with an empty string.
!8 = metadata !{metadata !"A", metadata !""}
!9 = metadata !{metadata !"B", metadata !""}
!10 = metadata !{metadata !"result", metadata !""}

; !11 is attached as `!map` to the _ssdm_op_SpecBitsMap call on %gmem.
; Through !12 and !13 it lists three entries (A, B, result); each entry
; carries the type string "int", the values 0 and 31, and the shared node
; !15 -> !16 = {0, 63, 1}.
; NOTE(review): presumably 0..31 is a bit range and {0, 63, 1} an element
; range with step -- confirm.
!11 = metadata !{metadata !12}
!12 = metadata !{i32 0, i32 31, metadata !13}
!13 = metadata !{metadata !14, metadata !17, metadata !18}
!14 = metadata !{metadata !"A", metadata !15, metadata !"int", i32 0, i32 31}
!15 = metadata !{metadata !16}
!16 = metadata !{i32 0, i32 63, i32 1}
!17 = metadata !{metadata !"B", metadata !15, metadata !"int", i32 0, i32 31}
!18 = metadata !{metadata !"result", metadata !15, metadata !"int", i32 0, i32 31}