; Assembler test input: SSE4.1 / SSE4.2 instruction forms in 64-bit mode.
;
; Each group lists one mnemonic in the operand combinations it is expected to
; accept: register source, memory source without a size override ([0]), and,
; where given, memory source with an explicit size override.  The order of
; the instructions is significant for the assembled output; do not reorder.

[bits 64]

; ---- Blends with an immediate mask ----
        blendpd xmm1, xmm2, 5
        blendpd xmm1, [0], 5

        blendps xmm1, xmm2, 5
        blendps xmm1, [0], 5

; ---- Variable blends: two-operand form and form with xmm0 spelled out ----
        blendvpd xmm1, xmm2
        blendvpd xmm1, xmm2, xmm0
        blendvpd xmm1, [0]
        blendvpd xmm1, [0], xmm0

        blendvps xmm1, xmm2
        blendvps xmm1, xmm2, xmm0
        blendvps xmm1, [0]
        blendvps xmm1, [0], xmm0

; ---- crc32, 32-bit legacy destination (eax) ----
        crc32 eax, bl
        crc32 eax, bh
        crc32 eax, r9b
        crc32 eax, byte [0]
        crc32 eax, bx
        crc32 eax, word [0]
        crc32 eax, ebx
        crc32 eax, dword [0]

; ---- crc32, 32-bit extended destination (r8d) ----
        crc32 r8d, bl
        ;crc32 r8d, bh ; error (bh cannot be encoded together with the REX prefix r8d needs)
        crc32 r8d, r9b
        crc32 r8d, byte [0]
        crc32 r8d, bx
        crc32 r8d, word [0]
        crc32 r8d, ebx
        crc32 r8d, dword [0]

; ---- crc32, 64-bit destination (rax) ----
        crc32 rax, bl
        ;crc32 rax, bh ; error (bh cannot be encoded together with the REX prefix rax needs)
        crc32 rax, r9b
        crc32 rax, byte [0]
        crc32 rax, rbx
        crc32 rax, qword [0]

; ---- Dot products ----
        dppd xmm1, xmm2, 5
        dppd xmm1, [0], 5

        dpps xmm1, xmm2, 5
        dpps xmm1, [0], 5

; ---- extractps: 32-bit, extended and 64-bit register destinations, memory ----
        extractps eax, xmm1, 5
        extractps [0], xmm1, 5
        extractps dword [0], xmm1, 5
        extractps r8d, xmm1, 5
        extractps rax, xmm1, 5

; ---- insertps ----
        insertps xmm1, xmm2, 5
        insertps xmm1, [0], 5
        insertps xmm1, dword [0], 5

; ---- movntdqa: memory source only, with and without dqword override ----
        movntdqa xmm1, [0]
        movntdqa xmm1, dqword [0]

; ---- mpsadbw / packusdw ----
        mpsadbw xmm1, xmm2, 5
        mpsadbw xmm1, [0], 5

        packusdw xmm1, xmm2
        packusdw xmm1, [0]

; ---- pblendvb: form with xmm0 spelled out, then two-operand form ----
        pblendvb xmm1, xmm2, xmm0
        pblendvb xmm1, [0], xmm0
        pblendvb xmm1, xmm2
        pblendvb xmm1, [0]

        pblendw xmm1, xmm2, 5
        pblendw xmm1, [0], 5

; ---- 64-bit element compare (equal) ----
        pcmpeqq xmm1, xmm2
        pcmpeqq xmm1, [0]

; ---- String compares ----
        pcmpestri xmm1, xmm2, 5
        pcmpestri xmm1, [0], 5

        pcmpestrm xmm1, xmm2, 5
        pcmpestrm xmm1, [0], 5

        pcmpistri xmm1, xmm2, 5
        pcmpistri xmm1, [0], 5

        pcmpistrm xmm1, xmm2, 5
        pcmpistrm xmm1, [0], 5

; ---- 64-bit element compare (greater than) ----
        pcmpgtq xmm1, xmm2
        pcmpgtq xmm1, [0]

; ---- Element extracts ----
        pextrb eax, xmm1, 5
        pextrb rax, xmm1, 5
        pextrb [0], xmm1, 5
        pextrb byte [0], xmm1, 5

        pextrd eax, xmm1, 5
        pextrd [0], xmm1, 5
        pextrd dword [0], xmm1, 5
        pextrq rax, xmm1, 5
        pextrq qword [0], xmm1, 5

; pextrw exists in both an SSE2 and an SSE4 version.  To get the SSE4
; versions we need to disable the SSE2 versions.  No later cpu directive
; appears in this listing, so the setting stays in effect for everything
; below as well.
        cpu nosse2
        pextrw eax, xmm1, 5
        pextrw [0], xmm1, 5
        pextrw word [0], xmm1, 5
        pextrw rax, xmm1, 5

; ---- phminposuw ----
        phminposuw xmm1, xmm2
        phminposuw xmm1, [0]

; ---- Element inserts ----
        pinsrb xmm1, eax, 5
        pinsrb xmm1, [0], 5
        pinsrb xmm1, byte [0], 5

        pinsrd xmm1, eax, 5
        pinsrd xmm1, [0], 5
        pinsrd xmm1, dword [0], 5

        pinsrq xmm1, rax, 5
        pinsrq xmm1, [0], 5
        pinsrq xmm1, qword [0], 5

; ---- Packed integer max ----
        pmaxsb xmm1, xmm2
        pmaxsb xmm1, [0]

        pmaxsd xmm1, xmm2
        pmaxsd xmm1, [0]

        pmaxud xmm1, xmm2
        pmaxud xmm1, [0]

        pmaxuw xmm1, xmm2
        pmaxuw xmm1, [0]

; ---- Packed integer min ----
        pminsb xmm1, xmm2
        pminsb xmm1, [0]

        pminsd xmm1, xmm2
        pminsd xmm1, [0]

        pminud xmm1, xmm2
        pminud xmm1, [0]

        pminuw xmm1, xmm2
        pminuw xmm1, [0]

; ---- pmovsx*: register, unsized memory, explicitly sized memory ----
        pmovsxbw xmm1, xmm2
        pmovsxbw xmm1, [0]
        pmovsxbw xmm1, qword [0]

        pmovsxbd xmm1, xmm2
        pmovsxbd xmm1, [0]
        pmovsxbd xmm1, dword [0]

        pmovsxbq xmm1, xmm2
        pmovsxbq xmm1, [0]
        pmovsxbq xmm1, word [0]

        pmovsxwd xmm1, xmm2
        pmovsxwd xmm1, [0]
        pmovsxwd xmm1, qword [0]

        pmovsxwq xmm1, xmm2
        pmovsxwq xmm1, [0]
        pmovsxwq xmm1, dword [0]

        pmovsxdq xmm1, xmm2
        pmovsxdq xmm1, [0]
        pmovsxdq xmm1, qword [0]

; ---- pmovzx*: same operand patterns as the pmovsx* group ----
        pmovzxbw xmm1, xmm2
        pmovzxbw xmm1, [0]
        pmovzxbw xmm1, qword [0]

        pmovzxbd xmm1, xmm2
        pmovzxbd xmm1, [0]
        pmovzxbd xmm1, dword [0]

        pmovzxbq xmm1, xmm2
        pmovzxbq xmm1, [0]
        pmovzxbq xmm1, word [0]

        pmovzxwd xmm1, xmm2
        pmovzxwd xmm1, [0]
        pmovzxwd xmm1, qword [0]

        pmovzxwq xmm1, xmm2
        pmovzxwq xmm1, [0]
        pmovzxwq xmm1, dword [0]

        pmovzxdq xmm1, xmm2
        pmovzxdq xmm1, [0]
        pmovzxdq xmm1, qword [0]

; ---- Packed multiplies ----
        pmuldq xmm1, xmm2
        pmuldq xmm1, [0]

        pmulld xmm1, xmm2
        pmulld xmm1, [0]

; ---- popcnt with 16-, 32- and 64-bit destinations ----
        popcnt ax, bx
        popcnt ax, [0]
        popcnt ebx, ecx
        popcnt ebx, [0]
        popcnt rcx, rdx
        popcnt rcx, [0]

; ---- ptest ----
        ptest xmm1, xmm2
        ptest xmm1, [0]

; ---- Rounding with an immediate control byte ----
        roundpd xmm1, xmm2, 5
        roundpd xmm1, [0], 5

        roundps xmm1, xmm2, 5
        roundps xmm1, [0], 5

        roundsd xmm1, xmm2, 5
        roundsd xmm1, [0], 5

        roundss xmm1, xmm2, 5
        roundss xmm1, [0], 5
