Parallel lab, 2022 spring, HW1: SIMD. ARM build command: `g++ -mcpu=apple-m1 neon.cpp -o test`. x86 build command: `g++ main.cpp -o test.exe`.