Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(189)

Side by Side Diff: src/trusted/validator_ragel/decoding.h

Issue 11000033: Move validator_x86_XX.rl out of unreviewed. (Closed) Base URL: svn://svn.chromium.org/native_client/trunk/src/native_client/
Patch Set: Created 7 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch | Annotate | Revision Log
OLDNEW
1 /* 1 /*
2 * Copyright (c) 2012 The Native Client Authors. All rights reserved. 2 * Copyright (c) 2012 The Native Client Authors. All rights reserved.
3 * Use of this source code is governed by a BSD-style license that can be 3 * Use of this source code is governed by a BSD-style license that can be
4 * found in the LICENSE file. 4 * found in the LICENSE file.
5 */ 5 */
6 6
7 /* 7 /*
8 * This file contains common parts of x86-32 and x86-64 internals (inline 8 * This file contains common parts of ia32 and x86-64 decoder and validator
9 * functions and defines). 9 * internals (inline functions which are used to pull useful information from
10 * "well-known" bytes of the instruction: REX and VEX prefixes, ModR/M byte and
11 * so on).
10 * 12 *
11 * We only include simple schematic diagrams here. For full description see 13 * See full description in AMD/Intel manuals.
12 * AMD/Intel manuals.
13 */ 14 */
14 15
15 #ifndef NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_ 16 #ifndef NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_
16 #define NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_ 17 #define NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_
17 18
18 #include "native_client/src/trusted/validator_ragel/decoder.h" 19 #include "native_client/src/trusted/validator_ragel/decoder.h"
19 20
20 #if NACL_WINDOWS 21 #if NACL_WINDOWS
21 # define FORCEINLINE __forceinline 22 # define FORCEINLINE __forceinline
22 #else 23 #else
23 # define FORCEINLINE __inline __attribute__ ((always_inline)) 24 # define FORCEINLINE __inline __attribute__ ((always_inline))
24 #endif 25 #endif
25 26
26 27
27 /* 28 /*
28 * Opcode with register number embedded: 29 * Opcode-with-register byte format:
29 * 30 *
30 * 7 6 5 4 3 2 1 0 31 * bits 0-2: register number
31 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 32 * bits 3-7: actual opcode
32 * │ Opcode │ register number ┃
33 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛
34 */ 33 */
35 static FORCEINLINE uint8_t RegFromOpcode(uint8_t modrm) { 34 static FORCEINLINE uint8_t RegFromOpcode(uint8_t modrm) {
36 return modrm & 0x07; 35 return modrm & 0x07;
37 } 36 }
38 37
39 /* 38 /*
40 * ModRM byte format: 39 * ModRM byte format:
41 * 40 *
42 * 7 6 5 4 3 2 1 0 41 * bits 0-2: r/m
43 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 42 * bits 3-5: reg
44 * │ mod │ reg │ r/m ┃ 43 * bits 6-7: mod
45 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛
46 */ 44 */
47 static FORCEINLINE uint8_t ModFromModRM(uint8_t modrm) { 45 static FORCEINLINE uint8_t ModFromModRM(uint8_t modrm) {
48 return modrm >> 6; 46 return modrm >> 6;
49 } 47 }
50 48
51 static FORCEINLINE uint8_t RegFromModRM(uint8_t modrm) { 49 static FORCEINLINE uint8_t RegFromModRM(uint8_t modrm) {
52 return (modrm & 0x38) >> 3; 50 return (modrm >> 3) & 0x07;
53 } 51 }
54 52
55 static FORCEINLINE uint8_t RMFromModRM(uint8_t modrm) { 53 static FORCEINLINE uint8_t RMFromModRM(uint8_t modrm) {
56 return modrm & 0x07; 54 return modrm & 0x07;
57 } 55 }
58 56
59 /* 57 /*
60 * SIB byte format: 58 * SIB byte format:
61 * 59 *
62 * 7 6 5 4 3 2 1 0 60 * bits 0-2: base
63 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 61 * bits 3-5: index
64 * │ scale │ index │ base ┃ 62 * bits 6-7: scale
65 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛
66 */ 63 */
67 static FORCEINLINE uint8_t ScaleFromSIB(uint8_t sib) { 64 static FORCEINLINE uint8_t ScaleFromSIB(uint8_t sib) {
68 return sib >> 6; 65 return sib >> 6;
69 } 66 }
70 67
71 static FORCEINLINE uint8_t IndexFromSIB(uint8_t sib) { 68 static FORCEINLINE uint8_t IndexFromSIB(uint8_t sib) {
72 return (sib & 0x38) >> 3; 69 return (sib >> 3) & 0x07;
73 } 70 }
74 71
75 static FORCEINLINE uint8_t BaseFromSIB(uint8_t sib) { 72 static FORCEINLINE uint8_t BaseFromSIB(uint8_t sib) {
76 return sib & 0x07; 73 return sib & 0x07;
77 } 74 }
78 75
79 /* 76 /*
80 * REX byte format: 77 * REX byte format:
81 * 78 *
82 * 7 6 5 4 3 2 1 0 79 * bit 0: B (Base)
83 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 80 * bit 1: X (indeX)
84 * │ 0 │ 1 │ 0 │ 0 │ W │ R │ X │ B ┃ 81 * bit 2: R (Register)
85 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛ 82 * bit 3: W (Wide)
83 * bits 4-7: 0x4 (REX signature)
86 */ 84 */
87 85
88 enum { 86 enum {
89 REX_B = 1, 87 REX_B = 1,
90 REX_X = 2, 88 REX_X = 2,
91 REX_R = 4, 89 REX_R = 4,
92 REX_W = 8 90 REX_W = 8
93 }; 91 };
94 92
93 /* How much to add to "base register" number: 0 or 8 */
95 static FORCEINLINE uint8_t BaseExtentionFromREX(uint8_t rex) { 94 static FORCEINLINE uint8_t BaseExtentionFromREX(uint8_t rex) {
96 return (rex & REX_B) << 3; 95 return (rex & REX_B) << 3;
97 } 96 }
98 97
98 /* How much to add to "index register" number: 0 or 8 */
99 static FORCEINLINE uint8_t IndexExtentionFromREX(uint8_t rex) { 99 static FORCEINLINE uint8_t IndexExtentionFromREX(uint8_t rex) {
100 return (rex & REX_X) << 2; 100 return (rex & REX_X) << 2;
101 } 101 }
102 102
103 /* How much to add to "register operand" number: 0 or 8 */
103 static FORCEINLINE uint8_t RegisterExtentionFromREX(uint8_t rex) { 104 static FORCEINLINE uint8_t RegisterExtentionFromREX(uint8_t rex) {
104 return (rex & REX_R) << 1; 105 return (rex & REX_R) << 1;
105 } 106 }
106 107
107 /* 108 /*
108 * VEX 2nd byte format: 109 * VEX 2nd byte format:
109 * 110 *
110 * 7 6 5 4 3 2 1 0 111 * bits 0-4: opcode map selector
111 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 112 * bit 5: inverted B (Base)
112 * │ ¬R │ ¬X │ ¬B │ opcode map selector ┃ 113 * bit 6: inverted X (indeX)
113 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛ 114 * bit 7: inverted R (Register)
114 */ 115 */
115 116
116 enum { 117 enum {
117 VEX_MAP1 = 0x01, 118 VEX_MAP1 = 0x01,
118 VEX_MAP2 = 0x02, 119 VEX_MAP2 = 0x02,
119 VEX_MAP3 = 0x03, 120 VEX_MAP3 = 0x03,
120 VEX_MAP8 = 0x08, 121 VEX_MAP8 = 0x08,
121 VEX_MAP9 = 0x09, 122 VEX_MAP9 = 0x09,
122 VEX_MAPA = 0x0a, 123 VEX_MAPA = 0x0a,
123 VEX_B = 0x20, 124 VEX_B = 0x20,
124 VEX_X = 0x40, 125 VEX_X = 0x40,
125 VEX_R = 0x80, 126 VEX_R = 0x80,
126 VEX_W = 0x80 127 VEX_W = 0x80
halyavin 2013/03/25 09:43:41 Add a comment explaining that VEX_W is in the thir
khim 2013/03/25 11:33:48 Added separate enum for 3rd byte instead.
127 }; 128 };
128 129
129 static FORCEINLINE uint8_t BaseExtentionFromVEX(uint8_t vex2) { 130 static FORCEINLINE uint8_t BaseExtentionFromVEX(uint8_t vex2) {
halyavin 2013/03/25 09:43:41 Add comments similar to comments for REX prefixes.
khim 2013/03/25 11:33:48 Done.
130 return ((~vex2) & VEX_B) >> 2; 131 return ((~vex2) & VEX_B) >> 2;
131 } 132 }
132 133
133 static FORCEINLINE uint8_t IndexExtentionFromVEX(uint8_t vex2) { 134 static FORCEINLINE uint8_t IndexExtentionFromVEX(uint8_t vex2) {
134 return ((~vex2) & VEX_X) >> 3; 135 return ((~vex2) & VEX_X) >> 3;
135 } 136 }
136 137
137 static FORCEINLINE uint8_t RegisterExtentionFromVEX(uint8_t vex2) { 138 static FORCEINLINE uint8_t RegisterExtentionFromVEX(uint8_t vex2) {
138 return ((~vex2) & VEX_R) >> 4; 139 return ((~vex2) & VEX_R) >> 4;
139 } 140 }
140 141
141 /* 142 /*
142 * VEX 3rd byte format: 143 * VEX 3rd byte format:
143 * 144 *
144 * 7 6 5 4 3 2 1 0 145 * bits 0-1: pp (Packed Prefix)
145 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 146 * bit 2: L (Long)
146 * │ W │ ¬vvvv (register number) │ L │ pp ┃ 147 * bits 3-6: negated vvvv (register number)
147 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛ 148 * bit 7: W (Wide)
148 */ 149 */
149 150
150 static FORCEINLINE uint8_t GetOperandFromVexIA32(uint8_t vex3) { 151 static FORCEINLINE uint8_t GetOperandFromVexIA32(uint8_t vex3) {
151 return ((~vex3) & 0x38) >> 3; 152 return ((~vex3) >> 3) & 0x07;
152 } 153 }
153 154
154 static FORCEINLINE uint8_t GetOperandFromVexAMD64(uint8_t vex3) { 155 static FORCEINLINE uint8_t GetOperandFromVexAMD64(uint8_t vex3) {
155 return ((~vex3) & 0x78) >> 3; 156 return ((~vex3) >> 3) & 0x0f;
156 } 157 }
157 158
158 /* 159 /*
159 * is4 byte format: 160 * is4/is5 byte format:
160 * 161 *
161 * 7 6 5 4 3 2 1 0 162 * bits 0-1: imm2 or zero
162 * ┌───────┬───────┬───────┬───────┬───────┬───────┬───────┬───────┒ 163 * bits 2-3: 0
163 * │ vvvv (register number) │ 0 │ 0 │ imm2 or zero ┃ 164 * bits 4-7: register number
164 * ┕━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┷━━━━━━━┛
165 */ 165 */
166 static FORCEINLINE uint8_t RegisterFromIS4(uint8_t is4) { 166 static FORCEINLINE uint8_t RegisterFromIS4(uint8_t is4) {
167 return is4 >> 4; 167 return is4 >> 4;
168 } 168 }
169 169
170 /* 170 /*
171 * SignExtendXXBit is used to sign-extend XX-bit value to unsigned 64-bit value. 171 * SignExtendXXBit is used to sign-extend XX-bit value to unsigned 64-bit value.
172 * 172 *
173 * To do that you need to pass unsigned value of smaller than 64-bit size 173 * To do that you need to pass unsigned value of smaller than 64-bit size
174 * to this function: it will be converted to signed value and then 174 * to this function: it will be converted to signed value and then
175 * sign-extended to become 64-bit value. 175 * sign-extended to become 64-bit value.
176 * 176 *
177 * Smaller values can be obtained by restricting this value further (which is 177 * Return values can be restricted to smaller unsigned type when needed (which
178 * safe according to the C language specification: see 6.2.1.2 in C90 and 178 * is safe according to the C language specification: see 6.2.1.2 in C90 and
179 * 6.3.1.3.2 in C99 specification). 179 * 6.3.1.3.2 in C99 specification).
180 * 180 *
181 * Note that these operations are safe but slightly unusual: they come very 181 * Note that these operations are safe but slightly unusual: they come very
182 * close to the edge of what "well-behaved C program is not supposed to do", 182 * close to the edge of what "well-behaved C program is not supposed to do",
183 * but they stay on the "safe" side of this boundary. Specifically: this 183 * but they stay on the "safe" side of this boundary. Specifically: this
184 * behavior triggers "implementation-defined behavior" (see 6.2.1.2 in C90 184 * (conversion to intXX_t) behavior triggers "implementation-defined behavior"
185 * specification and 6.3.1.3.3 in C99 specification) which sounds suspiciously 185 * (see 6.2.1.2 in C90 specification and 6.3.1.3.3 in C99 specification) which
186 * similar to the dreaded "undefined behavior", but in reality these two are 186 * sounds suspiciously similar to the dreaded "undefined behavior", but in
187 * quite different: any program which triggers "undefined behavior" is not a 187 * reality these two are quite different: any program which triggers "undefined
188 * valid C program at all, but program which triggers "implementation-defined 188 * behavior" is not a valid C program at all, but program which triggers
189 * behavior" is quite valid C program. What this program actually *does* 189 * "implementation-defined behavior" is quite valid C program. What this
190 * depends on the specification of a given C compiler: each particular 190 * program actually *does* depends on the specification of a given C compiler:
191 * implementation must decide for itself what it'll do in this particular case 191 * each particular implementation must decide for itself what it'll do in this
192 * and *stick* *to* *it*. If the implementation uses two's-complement negative 192 * particular case and *stick* *to* *it*. If the implementation actually uses
193 * numbers (and all the implementation which can compile this code *must* 193 * two's-complement negative numbers (and all the implementation which can
194 * support two's-complement arithmetic - see 7.18.1.1 in C99 specification) then 194 * compile this code *must* support two's-complement arithmetic - see 7.18.1.1
195 * the easiest thing to do is to do what we need here - this is what all known 195 * in C99 specification) then the easiest thing to do is to do what we need
196 * compilers for all known platforms are actually doing. 196 * here - this is what all known compilers for all known platforms are actually
197 * doing.
198 *
199 * Conversion from intXX_t to uint64_t is always safe (same as before: see
200 * 6.2.1.2 in C90 specification and 6.3.1.3.2 in C99 specification).
197 */ 201 */
198 static FORCEINLINE uint64_t SignExtend8Bit(uint64_t value) { 202 static FORCEINLINE uint64_t SignExtend8Bit(uint64_t value) {
199 return (int8_t)value; 203 return (int8_t)value;
200 } 204 }
201 205
202 static FORCEINLINE uint64_t SignExtend16Bit(uint64_t value) { 206 static FORCEINLINE uint64_t SignExtend16Bit(uint64_t value) {
203 return (int16_t)value; 207 return (int16_t)value;
204 } 208 }
205 209
206 static FORCEINLINE uint64_t SignExtend32Bit(uint64_t value) { 210 static FORCEINLINE uint64_t SignExtend32Bit(uint64_t value) {
(...skipping 19 matching lines...) Expand all
226 230
227 static const uint8_t index_registers[] = { 231 static const uint8_t index_registers[] = {
228 /* Note how REG_RIZ falls out of the pattern. */ 232 /* Note how REG_RIZ falls out of the pattern. */
229 REG_RAX, REG_RCX, REG_RDX, REG_RBX, 233 REG_RAX, REG_RCX, REG_RDX, REG_RBX,
230 REG_RIZ, REG_RBP, REG_RSI, REG_RDI, 234 REG_RIZ, REG_RBP, REG_RSI, REG_RDI,
231 REG_R8, REG_R9, REG_R10, REG_R11, 235 REG_R8, REG_R9, REG_R10, REG_R11,
232 REG_R12, REG_R13, REG_R14, REG_R15 236 REG_R12, REG_R13, REG_R14, REG_R15
233 }; 237 };
234 238
235 #endif /* NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_ */ 239 #endif /* NATIVE_CLIENT_SRC_TRUSTED_VALIDATOR_RAGEL_DECODING_H_ */
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698