__m128 _mm_load_ps1(float const* mem_addr);
dst[31:0] := MEM[mem_addr+31:mem_addr]
dst[63:32] := MEM[mem_addr+31:mem_addr]
dst[95:64] := MEM[mem_addr+31:mem_addr]
dst[127:96] := MEM[mem_addr+31:mem_addr]