1*5971e316Smrg for (int c0 = 0; c0 < n - 31; c0 += 32) 2*5971e316Smrg for (int c1 = 0; c1 <= n; c1 += 32) { 3*5971e316Smrg if (n >= c1 + 32) { 4*5971e316Smrg for (int c2 = 0; c2 <= 31; c2 += 1) 5*5971e316Smrg for (int c3 = 0; c3 <= 31; c3 += 1) 6*5971e316Smrg S_1(c0 + c2, c1 + c3); 7*5971e316Smrg } else { 8*5971e316Smrg for (int c2 = 0; c2 <= 31; c2 += 1) { 9*5971e316Smrg for (int c3 = 0; c3 < n - c1; c3 += 1) 10*5971e316Smrg S_1(c0 + c2, c1 + c3); 11*5971e316Smrg S_2(c0 + c2); 12*5971e316Smrg } 13*5971e316Smrg } 14*5971e316Smrg } 15*5971e316Smrg for (int c1 = 0; c1 < n; c1 += 32) { 16*5971e316Smrg if (n >= c1 + 32) { 17*5971e316Smrg for (int c2 = 0; c2 < (n + 32) % 32; c2 += 1) 18*5971e316Smrg for (int c3 = 0; c3 <= 31; c3 += 1) 19*5971e316Smrg S_1(-((n + 32) % 32) + n + c2, c1 + c3); 20*5971e316Smrg } else { 21*5971e316Smrg for (int c2 = 0; c2 < n - c1; c2 += 1) { 22*5971e316Smrg for (int c3 = 0; c3 < n - c1; c3 += 1) 23*5971e316Smrg S_1(c1 + c2, c1 + c3); 24*5971e316Smrg S_2(c1 + c2); 25*5971e316Smrg } 26*5971e316Smrg } 27*5971e316Smrg } 28