Rev 2434 | Rev 3232 | Go to most recent revision | Only display areas with differences | Regard whitespace | Details | Blame | Last modification | View Log | RSS feed
Rev 2434 | Rev 2465 | ||
---|---|---|---|
1 | ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
1 | ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
2 | ;; ;; |
2 | ;; ;; |
3 | ;; Copyright (C) KolibriOS team 2004-2009. All rights reserved. ;; |
3 | ;; Copyright (C) KolibriOS team 2004-2011. All rights reserved. ;; |
4 | ;; Distributed under terms of the GNU General Public License ;; |
4 | ;; Distributed under terms of the GNU General Public License ;; |
5 | ;; ;; |
5 | ;; ;; |
6 | ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
6 | ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
7 | 7 | ||
8 | $Revision: 2434 $ |
8 | $Revision: 2465 $ |
9 | 9 | ||
10 | 10 | ||
11 | ; Small heap based on malloc/free/realloc written by Doug Lea |
11 | ; Small heap based on malloc/free/realloc written by Doug Lea |
12 | ; Version 2.8.3 Thu Sep 22 11:16:15 2005 Doug Lea (dl at gee) |
12 | ; Version 2.8.3 Thu Sep 22 11:16:15 2005 Doug Lea (dl at gee) |
13 | ; Source ftp://gee.cs.oswego.edu/pub/misc/malloc.c |
13 | ; Source ftp://gee.cs.oswego.edu/pub/misc/malloc.c |
14 | ; License http://creativecommons.org/licenses/publicdomain. |
14 | ; License http://creativecommons.org/licenses/publicdomain. |
15 | 15 | ||
16 | 16 | ||
; malloc -- allocate a block from the small heap.
;
; in:   eax = requested size in bytes
; out:  eax = pointer to the usable memory (chunk address + 8),
;             or 0 when the request cannot be satisfied
; esi is saved and restored; ebx, ecx and edx may be overwritten.
;
; Chunk fields as used below:
;   [p+0]  prev_foot   [p+4]  head = size | flag bits (1 = PINUSE, 2 = CINUSE)
;   [p+8]  fd          [p+12] bk
; Small bins are 16 bytes apart and are addressed like chunks (fd at +8,
; bk at +12); bin I holds free chunks of size I*8.
;
; working registers: esi = nb (padded size), ebx = bin index
align 4
malloc:
        push    esi

; nb = ((size+7) & ~7) + 8
; A carry out of either addition means the padded size does not fit in
; 32 bits. Without these checks a request just below 4 GB would wrap to a
; tiny nb and be "satisfied" with a block far smaller than asked for.

        mov     esi, eax
        add     esi, 7
        jc      .too_big
        and     esi, -8
        add     esi, 8                          ; esi = nb
        jc      .too_big

        mov     ecx, mst.mutex
        call    mutex_lock

        cmp     esi, 256
        jae     .large

; Small request: keep only the smallmap bits of bins >= nb>>3.

        mov     ecx, esi
        shr     ecx, 3
        or      eax, -1
        shl     eax, cl
        and     eax, [mst.smallmap]
        jz      .small                          ; no small bin can serve it

        push    ebp
        push    edi

        bsf     eax, eax                        ; lowest non-empty usable bin
        mov     ebx, eax                        ; ebx = idx

; psize = idx<<3;
; B = &ms.smallbins[idx];
; p = B->fd;
; F = p->fd;
; rsize = psize-nb;

        lea     ebp, [eax*8]                    ; ebp = psize
        shl     eax, 4
        lea     edi, [mst.smallbins+eax]        ; edi = B
        mov     edx, [edi+8]                    ; edx = p
        mov     eax, [edx+8]                    ; eax = F
        mov     ecx, ebp
        sub     ecx, esi                        ; ecx = rsize

; if (B == F) the bin becomes empty: clear its smallmap bit

        cmp     edi, eax
        jne     .bin_not_empty
        btr     [mst.smallmap], ebx
.bin_not_empty:

; B->fd = F;
; F->bk = B;
; if (rsize < 16) hand out the whole chunk

        cmp     ecx, 16
        mov     [edi+8], eax                    ; mov does not disturb the flags
        mov     [eax+12], edi
        jae     .split

; p->head = psize|PINUSE_BIT|CINUSE_BIT;
; (p + psize)->head |= PINUSE_BIT;

        lea     eax, [edx+8]                    ; eax = mem
        or      dword [edx+ebp+4], 1
        or      ebp, 3
        mov     [edx+4], ebp

        pop     edi
        pop     ebp

; Common exit: eax = result. It is parked in esi while the mutex is released.
.done:
        mov     esi, eax
        mov     ecx, mst.mutex
        call    mutex_unlock
        mov     eax, esi
        pop     esi
        ret

.split:
        lea     ebx, [edx+8]                    ; ebx = mem

; r = chunk_plus_offset(p, nb);
; p->head = nb|PINUSE_BIT|CINUSE_BIT;
; r->head = rsize|PINUSE_BIT;

        lea     eax, [edx+esi]                  ; eax = r
        or      esi, 3
        mov     [edx+4], esi

        mov     edx, ecx
        or      edx, 1
        mov     [eax+4], edx

; (r + rsize)->prev_foot = rsize;

        mov     [eax+ecx], ecx

; I = rsize>>3;
; ms.smallmap |= 1<<I;

        shr     ecx, 3
        bts     [mst.smallmap], ecx

; B = &ms.smallbins[I];

        shl     ecx, 4
        pop     edi
        pop     ebp
        add     ecx, mst.smallbins              ; ecx = B

; link the remainder r at the front of bin B

        mov     edx, [ecx+8]                    ; F = B->fd
        mov     [ecx+8], eax                    ; B->fd = r
        mov     [edx+12], eax                   ; F->bk = r
        mov     [eax+8], edx                    ; r->fd = F
        mov     [eax+12], ecx                   ; r->bk = B

        mov     eax, ebx
        jmp     .done

.small:

; if (ms.treemap != 0 && (mem = malloc_small(nb)) != 0)

        mov     eax, [mst.treemap]
        test    eax, eax
        jz      .from_top
        mov     eax, esi
        call    malloc_small                    ; esi = nb on entry
        test    eax, eax
        jz      .from_top
        jmp     .done

.large:

; if (ms.treemap != 0 && (mem = malloc_large(nb)) != 0)

        cmp     [mst.treemap], 0
        je      .from_top

        call    malloc_large                    ; esi = nb
        test    eax, eax
        jne     .done

.from_top:

; if (nb < ms.topsize) carve the block off the top chunk

        mov     eax, [mst.topsize]
        cmp     esi, eax
        jae     .fail

; rsize = ms.topsize -= nb;
; p = ms.top;

        mov     ecx, [mst.top]
        sub     eax, esi
        mov     [mst.topsize], eax

; r = ms.top = chunk_plus_offset(p, nb);
; r->head = rsize | PINUSE_BIT;
; p->head = nb | PINUSE_BIT | CINUSE_BIT;

        lea     edx, [ecx+esi]
        or      eax, 1
        mov     [mst.top], edx
        or      esi, 3
        mov     [edx+4], eax
        mov     [ecx+4], esi
        lea     eax, [ecx+8]
        jmp     .done

.fail:
        xor     eax, eax
        jmp     .done

; Request too large to pad: the mutex has not been taken yet, so return
; 0 directly instead of going through .done.
.too_big:
        xor     eax, eax
        pop     esi
        ret
200 | 200 | ||
; free -- give a block back to the small heap, merging it with free
; neighbours where possible.
;
; in:   eax = pointer to the usable memory of a chunk (0 is ignored)
;
; edi and esi are pushed here and popped again before the routine leaves
; or tail-jumps to insert_chunk; eax, ebx, ecx and edx are overwritten.
; Chunk fields: [p+0] prev_foot, [p+4] head (size | 1 = PINUSE | 2 = CINUSE),
; [p+8] fd, [p+12] bk.
;
; working registers: edi = p, esi = psize, ebx = next
align 4
free:
        test    eax, eax
        jz      .exit

        push    edi
        lea     edi, [eax-8]                    ; edi = p (chunk header)

; if (p->head & CINUSE_BIT) -- otherwise the chunk is not allocated
; and the call is ignored

        test    byte [edi+4], 2
        jz      .fail

        mov     ecx, mst.mutex
        call    mutex_lock

; psize = p->head & (~3);

        mov     eax, [edi+4]
        push    esi
        mov     esi, eax
        and     esi, -4                         ; esi = psize

; next = chunk_plus_offset(p, psize);
; if (!(p->head & PINUSE_BIT)) merge with the free chunk in front of p

        lea     ebx, [edi+esi]                  ; ebx = next
        test    al, 1
        jnz     .check_next

; prevsize = p->prev_foot;
; prev = p - prevsize;
; psize += prevsize;
; p = prev;

        mov     ecx, [edi]                      ; ecx = prevsize
        add     esi, ecx
        sub     edi, ecx

; if (prevsize < 256) prev sits in a small bin, else in a tree bin

        cmp     ecx, 256
        jae     .unlink_prev_tree

        mov     eax, [edi+8]                    ; F = p->fd
        mov     edx, [edi+12]                   ; B = p->bk

; if (F == B) ms.smallmap &= ~(1<<I);

        shr     ecx, 3                          ; I = prevsize>>3
        cmp     eax, edx
        jne     .prev_bin_kept
        btr     [mst.smallmap], ecx
.prev_bin_kept:
        mov     [eax+12], edx                   ; F->bk = B
        mov     [edx+8], eax                    ; B->fd = F
        jmp     .check_next

.unlink_prev_tree:
        mov     edx, edi
        call    unlink_large_chunk

.check_next:

; if (next->head & PINUSE_BIT) -- otherwise give up and just unlock

        mov     eax, [ebx+4]                    ; eax = next->head
        test    al, 1
        jz      .unlock

; if (!(next->head & CINUSE_BIT)) next is free as well

        test    al, 2
        jnz     .next_in_use

; if (next == ms.top) the freed space is absorbed by the top chunk

        cmp     ebx, [mst.top]
        jne     .merge_next

; tsize = ms.topsize += psize;
; ms.top = p;
; p->head = tsize | PINUSE_BIT;

        mov     eax, [mst.topsize]
        add     eax, esi
        mov     [mst.topsize], eax
        or      eax, 1
        mov     [mst.top], edi
        mov     [edi+4], eax

.unlock:
        mov     esi, eax                        ; keep eax across the call
        mov     ecx, mst.mutex
        call    mutex_unlock
        mov     eax, esi
        pop     esi
.fail:
        pop     edi
.exit:
        ret

.merge_next:

; nsize = next->head & ~INUSE_BITS;
; psize += nsize;

        and     eax, -4
        add     esi, eax

; if (nsize < 256) next sits in a small bin, else in a tree bin

        cmp     eax, 256
        jae     .unlink_next_tree

        mov     edx, [ebx+8]                    ; F = next->fd
        mov     ebx, [ebx+12]                   ; B = next->bk

; if (F == B) ms.smallmap &= ~(1<<(nsize>>3));

        cmp     edx, ebx
        jne     .next_bin_kept
        mov     ecx, eax
        shr     ecx, 3
        btr     [mst.smallmap], ecx
.next_bin_kept:
        mov     [edx+12], ebx                   ; F->bk = B
        mov     [ebx+8], edx                    ; B->fd = F
        jmp     .insert

.unlink_next_tree:

; unlink_large_chunk((tchunkptr)next);

        mov     edx, ebx
        call    unlink_large_chunk
        jmp     .insert

.next_in_use:

; next->head &= ~PINUSE_BIT;

        and     eax, -2
        mov     [ebx+4], eax

; Shared tail of the three cases above:
;   p->head = psize|PINUSE_BIT;
;   (p+psize)->prev_foot = psize;
;   insert_chunk(p, psize);
; insert_chunk releases the mutex and returns to free's caller.
.insert:
        mov     ecx, esi
        or      ecx, 1
        mov     [edi+4], ecx
        mov     [edi+esi], esi

        mov     eax, esi                        ; eax = size
        pop     esi
        mov     ecx, edi                        ; ecx = chunk
        pop     edi
        jmp     insert_chunk
393 | 393 | ||
; insert_chunk -- put a free chunk into the bin matching its size, then
; release the heap mutex.
;
; in:   ecx = chunk
;       eax = size
; esi is saved and restored; eax, ecx and edx are overwritten, and ebx is
; loaded with the size when the chunk goes to a tree bin.

insert_chunk:
        push    esi
        mov     esi, ecx                        ; esi = P
        cmp     eax, 256
        jb      .small_bin

; sizes of 256 and above live in the tree bins

        mov     ebx, eax
        call    insert_large_chunk
        jmp     .unlock

.small_bin:

; I = S>>3;
; ms.smallmap |= 1<<I;

        shr     eax, 3
        bts     [mst.smallmap], eax

; B = &ms.smallbins[I];  then link P right behind the bin header

        shl     eax, 4
        add     eax, mst.smallbins              ; eax = B
        mov     edx, [eax+8]                    ; F = B->fd
        mov     [eax+8], esi                    ; B->fd = P
        mov     [edx+12], esi                   ; F->bk = P
        mov     [esi+8], edx                    ; P->fd = F
        mov     [esi+12], eax                   ; P->bk = B

.unlock:
        pop     esi
        mov     ecx, mst.mutex
        call    mutex_unlock
        ret
431 | 431 | ||
432 | 432 | ||
; insert_large_chunk -- add a free chunk to the tree bin for its size.
;
; in:   esi = chunk (X)
;       ebx = size  (S), expected to be >= 256 so that S>>8 is non-zero
;             for the BSR below
; eax, ecx and edx are overwritten. edi is used as scratch on the tree
; path and is saved/restored here: free pops the caller's edi and then
; tail-jumps (through insert_chunk) into this routine, so leaving edi
; modified would corrupt a register free had just restored.
;
; Tree chunk fields: [X+4] head, [X+8] fd, [X+12] bk,
; [X+16] child[0], [X+20] child[1], [X+24] parent, [X+28] index.

insert_large_chunk:
        push    edi

; I = compute_tree_index(S);

        mov     edx, ebx
        shr     edx, 8
        bsr     eax, edx                        ; eax = K = top bit of S>>8
        lea     ecx, [eax+7]
        mov     edx, ebx
        shr     edx, cl
        and     edx, 1                          ; bit K+7 of S
        lea     ecx, [edx+eax*2]                ; ecx = I

; X->index = I;
        mov     dword [esi+28], ecx

; X->child[0] = X->child[1] = 0;
        and     dword [esi+20], 0
        and     dword [esi+16], 0

; H = &ms.treebins[I];

        mov     eax, ecx
        lea     edx, [mst.treebins+eax*4]       ; edx = H

; if (!(ms.treemap & 1<<I))
        bt      [mst.treemap], ecx
        jc      .tree

; ms.treemap |= 1<<I;
        bts     [mst.treemap], ecx
; *H = X;
        mov     dword [edx], esi
        jmp     .done                           ; parent = H, X is the bin root

.tree:

; T = *H;
        mov     edx, [edx]

; K = S << leftshift_for_tree_index(I);
; neg/sbb turns (I-31) into a mask: 0 when I == 31, all ones otherwise,
; so the shift count is 0 for the last bin and 37-(I>>1) for the rest.
; NOTE(review): Doug Lea's reference computes this count as
; 31-((I>>1)+8-2) = 25-(I>>1); here the constant is 37 (SHL uses the
; count modulo 32). malloc_large uses the same 37, so both must change
; together -- confirm the intent before touching either.
        mov     eax, ecx
        shr     eax, 1
        sub     ecx, 31
        mov     edi, 37
        sub     edi, eax
        neg     ecx
        sbb     ecx, ecx
        and     ecx, edi
        mov     eax, ebx
        shl     eax, cl                         ; eax = K

        jmp     .loop

.not_eq_size:

; C = &(T->child[(K >> 31) & 1]);
        mov     ecx, eax
        shr     ecx, 31
        lea     ecx, [edx+ecx*4+16]

; K <<= 1;
; if (*C != 0)
        mov     edi, [ecx]
        add     eax, eax
        test    edi, edi
        jz      .insert_child

; T = *C;
        mov     edx, edi

.loop:

; for (;;)
; if ((T->head & ~INUSE_BITS) != S) keep descending

        mov     ecx, [edx+4]
        and     ecx, not 3
        cmp     ecx, ebx
        jne     .not_eq_size

; Same size as T: X joins T's ring of equal-sized chunks and is not a
; tree node itself.

; F = T->fd;
        mov     eax, [edx+8]

; T->fd = F->bk = X;
        mov     [eax+12], esi
        mov     [edx+8], esi

; X->fd = F;
; X->bk = T;
; X->parent = 0;

        and     dword [esi+24], 0
        mov     [esi+8], eax
        mov     [esi+12], edx
        pop     edi
        ret

.insert_child:

; *C = X;
        mov     [ecx], esi

.done:

; X->parent = T;   (T is H when X became the root of an empty bin)
        mov     [esi+24], edx

; X->fd = X->bk = X;
        mov     [esi+12], esi
        mov     [esi+8], esi
        pop     edi
        ret
543 | 543 | ||
544 | 544 | ||
; unlink_large_chunk -- take a chunk out of its tree bin.
;
; in:   edx = chunk (X)
; edi and esi are saved and restored; eax, ecx and edx are overwritten.
;
; Tree chunk fields: [X+8] fd, [X+12] bk, [X+16] child[0],
; [X+20] child[1], [X+24] parent, [X+28] index.
;
; working registers: edi = XP (X's parent), eax = R (replacement for X,
; possibly 0), esi = RP (address of the link that points to R)

unlink_large_chunk:
        push    edi
        mov     edi, [edx+24]                   ; XP = X->parent
        mov     eax, [edx+12]                   ; R = X->bk
        cmp     eax, edx
        je      .pick_descendant

; X shares its size with other chunks: drop it from their ring and let
; R stand in for it.

        mov     ecx, [edx+8]                    ; F = X->fd
        mov     [ecx+12], eax                   ; F->bk = R
        mov     [eax+8], ecx                    ; R->fd = F
        jmp     .fix_parent

; X is alone in its ring: the replacement is found by walking down from
; X, preferring child[1] over child[0] at every level, until a node
; without children is reached.
.pick_descendant:
        push    esi
        lea     esi, [edx+20]                   ; RP = &X->child[1]
        mov     eax, [esi]
        test    eax, eax
        jnz     .walk

        lea     esi, [edx+16]                   ; RP = &X->child[0]
        mov     eax, [esi]
        test    eax, eax
        jz      .no_child                       ; X is a leaf: R = 0

.walk:
        lea     ecx, [eax+20]                   ; CP = &R->child[1]
        cmp     dword [ecx], 0
        jne     .step

        lea     ecx, [eax+16]                   ; CP = &R->child[0]
        cmp     dword [ecx], 0
        je      .detach
.step:
        mov     esi, ecx                        ; RP = CP
        mov     eax, [ecx]                      ; R = *CP
        jmp     .walk

.detach:
        mov     dword [esi], 0                  ; *RP = 0
.no_child:
        pop     esi

.fix_parent:
        test    edi, edi
        jz      .done                           ; XP == 0: nothing to re-link

; is X the root of its tree bin?

        mov     ecx, [edx+28]
        lea     ecx, [mst.treebins+ecx*4]       ; ecx = H
        cmp     edx, [ecx]
        jne     .not_root

        mov     [ecx], eax                      ; *H = R
        test    eax, eax
        jnz     .adopt

; the bin is now empty: clear its treemap bit

        mov     ecx, [edx+28]
        btr     [mst.treemap], ecx
        pop     edi
        ret

.not_root:
        cmp     [edi+16], edx
        jne     .right_slot

        mov     [edi+16], eax                   ; XP->child[0] = R
        jmp     .slot_set

.right_slot:
        mov     [edi+20], eax                   ; XP->child[1] = R

.slot_set:
        test    eax, eax
        jz      .done

; R takes over X's parent and X's children

.adopt:
        mov     [eax+24], edi                   ; R->parent = XP
        mov     ecx, [edx+16]                   ; C0 = X->child[0]
        test    ecx, ecx
        jz      .right_child

        mov     [eax+16], ecx                   ; R->child[0] = C0
        mov     [ecx+24], eax                   ; C0->parent = R

.right_child:
        mov     edx, [edx+20]                   ; C1 = X->child[1]
        test    edx, edx
        jz      .done

        mov     [eax+20], edx                   ; R->child[1] = C1
        mov     [edx+24], eax                   ; C1->parent = R

.done:
        pop     edi
        ret
639 | 639 | ||
; malloc_small -- serve a small request from the tree bins.
; The chunk with the least leftover is searched in the lowest non-empty
; tree bin, unlinked, and split when the leftover is at least 16 bytes.
;
; in:   esi = nb (padded request size)
;       mst.treemap must be non-zero (BSF on it is used unchecked here;
;       malloc tests it before calling)
; out:  eax = pointer to the usable memory (chunk + 8)
; ebp and edi are saved and restored; ebx, ecx, edx and esi are overwritten.
;
; working registers: ebp = nb, ecx = t (node being examined),
; ebx = v (best chunk so far), edi = rsize (leftover of v), esi = r

malloc_small:
        push    ebp
        push    edi
        mov     ebp, esi                        ; ebp = nb

        bsf     eax, [mst.treemap]
        mov     ecx, [mst.treebins+eax*4]       ; t = root of that bin

; rsize = (t->head & ~INUSE_BITS) - nb;

        mov     edi, [ecx+4]
        and     edi, -4
        sub     edi, esi

.new_best:
        mov     ebx, ecx                        ; v = t

.descend:

; while ((t = leftmost_child(t)) != 0)
; leftmost_child: child[0] when present, otherwise child[1]

        mov     eax, [ecx+16]
        test    eax, eax
        jnz     .have_child
        mov     eax, [ecx+20]
.have_child:
        mov     ecx, eax
        test    ecx, ecx
        jz      .take

; trem = (t->head & ~INUSE_BITS) - nb;

        mov     eax, [ecx+4]
        and     eax, -4
        sub     eax, ebp

; if (trem < rsize) { rsize = trem; v = t; }

        cmp     eax, edi
        jae     .descend

        mov     edi, eax
        jmp     .new_best

.take:

; r = chunk_plus_offset((mchunkptr)v, nb);
; unlink_large_chunk(v);

        mov     edx, ebx
        lea     esi, [ebx+ebp]                  ; esi = r
        call    unlink_large_chunk

; if (rsize < 16) the leftover is too small to stand alone

        cmp     edi, 16
        jae     .split

; v->head = (rsize + nb)|PINUSE_BIT|CINUSE_BIT;
; (v + rsize + nb)->head |= PINUSE_BIT;

        lea     ecx, [edi+ebp]                  ; ecx = rsize + nb
        lea     eax, [ebx+ecx+4]                ; address of the next head
        or      ecx, 3
        mov     [ebx+4], ecx
        or      dword [eax], 1

        pop     edi
        pop     ebp
        lea     eax, [ebx+8]
        ret

.split:

; v->head = nb|PINUSE_BIT|CINUSE_BIT;
; r->head = rsize|PINUSE_BIT;
; (r+rsize)->prev_foot = rsize;

        or      ebp, 3
        mov     [ebx+4], ebp
        mov     edx, edi
        or      edx, 1
        mov     [esi+4], edx
        mov     [esi+edi], edi

        cmp     edi, 256
        jae     .large

; the remainder fits a small bin: I = rsize>>3, B = &ms.smallbins[I]

        shr     edi, 3
        bts     [mst.smallmap], edi

        mov     eax, edi
        shl     eax, 4
        add     eax, mst.smallbins              ; eax = B

        mov     edx, [eax+8]                    ; F = B->fd
        mov     [eax+8], esi                    ; B->fd = r
        mov     [edx+12], esi                   ; F->bk = r
        mov     [esi+8], edx                    ; r->fd = F
        mov     [esi+12], eax                   ; r->bk = B

        lea     eax, [ebx+8]
        pop     edi
        pop     ebp
        ret

.large:

; the remainder goes back into a tree bin; the result pointer is kept on
; the stack while insert_large_chunk (esi = r, ebx = rsize) runs

        lea     eax, [ebx+8]
        push    eax
        mov     ebx, edi
        call    insert_large_chunk
        pop     eax
        pop     edi
        pop     ebp
        ret
767 | 767 | ||
768 | 768 | ||
; malloc_large
;
; Best-fit search of the tree bins for a chunk able to hold nb bytes.
; The chosen chunk is unlinked from its tree; if at least 16 bytes are
; left over, the tail is split off and handed to insert_chunk.
;
; param
;  esi= nb
;
; return
;  eax= chunk address + 8, or 0 when no tree chunk is large enough
;
; preserved
;  ebp, esi, edi
;
; modified
;  ebx, ecx, edx, flags (plus whatever the called routines modify)
;
; temp
;  ebx= nb
;  edi= rsize   smallest remainder found so far (unsigned)
;  ebp= v       best chunk found so far, 0 if none
;  eax= t       tree node being examined
;  edx= sizebits
;
; NOTE(review): bsr leaves its destination undefined when the source is 0,
; so this routine presumably is only entered with nb >= 256, and there is
; no clamp of idx to 31 for very large nb - confirm against the caller.

malloc_large:
.idx equ esp+4
.rst equ esp

; the two locals are addressed relative to esp: nothing may be pushed
; between the sub esp, 8 below and the matching add esp, 8

        push    ebp
        push    esi
        push    edi
        sub     esp, 8

; v = 0;
; rsize = -nb;
; (any chunk with size >= nb gives an unsigned remainder below -nb,
;  any smaller non-empty chunk gives one above it)

        mov     edi, esi
        mov     ebx, esi
        xor     ebp, ebp
        neg     edi

; idx = compute_tree_index(nb);
; k = bsr(nb >> 8); idx = k*2 + ((nb >> (k+7)) & 1)

        mov     edx, esi
        shr     edx, 8
        bsr     eax, edx
        lea     ecx, [eax+7]
        shr     esi, cl
        and     esi, 1
        lea     ecx, [esi+eax*2]
        mov     [.idx], ecx

; if ((t = ms.treebins[idx]) != 0)

        mov     eax, [mst.treebins+ecx*4]
        test    eax, eax
        jz      .l3

; sizebits = nb << leftshift_for_tree_index(idx);
; shift = 0 for idx 31, otherwise 37 - (idx >> 1); shl uses only the low
; five bits of cl.
; NOTE(review): dlmalloc computes 25 - (idx >> 1) here. The value is left
; as is because it has to match the one used when chunks are inserted
; into the tree, which is outside this routine - confirm.

        cmp     ecx, 31
        jne     @F
        xor     ecx, ecx
        jmp     .l1

@@:
        mov     edx, ecx
        shr     edx, 1
        mov     ecx, 37
        sub     ecx, edx

.l1:
        mov     edx, ebx
        shl     edx, cl

; rst = 0;
        mov     [.rst], ebp             ; ebp is still 0 here

.loop:

; trem = (t->head & ~INUSE_BITS) - nb;

        mov     ecx, [eax+4]
        and     ecx, -4
        sub     ecx, ebx

; if (trem < rsize)

        cmp     ecx, edi
        jae     @F

; v = t;
; if ((rsize = trem) == 0)
;     break;                            exact fit

        test    ecx, ecx
        mov     ebp, eax                ; mov leaves the flags of test intact
        mov     edi, ecx
        je      .l2

@@:

; rt = t->child[1];

        mov     ecx, [eax+20]

; t = t->child[(sizebits >> 31) & 1];

        mov     esi, edx
        shr     esi, 31

; if (rt != 0 && rt != t)

        test    ecx, ecx
        mov     eax, [eax+esi*4+16]
        jz      @F
        cmp     ecx, eax
        jz      @F

; rst = rt;
        mov     [.rst], ecx

@@:
; if (t == 0)

        test    eax, eax
        jz      @F

; sizebits <<= 1;

        add     edx, edx
        jmp     .loop

@@:
; t = rst;
        mov     eax, [.rst]

.l2:
; if (t == 0 && v == 0)

        test    eax, eax
        jne     .l4
        test    ebp, ebp
        jne     .l7
        mov     ecx, [.idx]

.l3:

; here t == 0, v == 0 and ecx = idx
;
; leftbits = ((-1 << idx) << 1) & ms.treemap;
; if (leftbits != 0)
;
; Only bins strictly above idx are candidates. Bin idx is either empty
; (entry from the treebins test above) or has just been searched without
; success; leaving its bit in the mask would make bsf pick it again and
; the larger bins would never be looked at.
; The extra doubling is done with add because a shift count of 32
; (idx = 31) would be reduced to 0 by the CPU.

        or      edx, -1
        shl     edx, cl
        add     edx, edx
        and     edx, [mst.treemap]
        jz      @F

        bsf     eax, edx                ; lowest non-empty bin above idx
; t = ms.treebins[i];
        mov     eax, [mst.treebins+eax*4]

@@:

; while (t != 0)
        test    eax, eax
        jz      .l5

.l4:

; trem = (t->head & ~INUSE_BITS) - nb;

        mov     ecx, [eax+4]
        and     ecx, -4
        sub     ecx, ebx

; if (trem < rsize)

        cmp     ecx, edi
        jae     @F

; rsize = trem;

        mov     edi, ecx
; v = t;
        mov     ebp, eax

@@:

; t = leftmost_child(t);
; child[0] if it is not 0, otherwise child[1]

        mov     ecx, [eax+16]
        test    ecx, ecx
        je      @F
        mov     eax, ecx
        jmp     .l6

@@:
        mov     eax, [eax+20]

.l6:

; while (t != 0)

        test    eax, eax
        jne     .l4

.l5:

; if (v != 0)

        test    ebp, ebp
        jz      .done

.l7:

; r = chunk_plus_offset((mchunkptr)v, nb);
; unlink_large_chunk(v);
; edx= v is passed to unlink_large_chunk; ebx, esi, edi and ebp are used
; again after the call, so the callee is relied upon to keep them

        mov     edx, ebp
        lea     esi, [ebx+ebp]
        call    unlink_large_chunk

; if (rsize < 16)

        cmp     edi, 16
        jae     .large

; remainder too small to split: the whole chunk is handed out
; v->head = (rsize + nb)|PINUSE_BIT|CINUSE_BIT;

        lea     ecx, [edi+ebx]

; (v+rsize + nb)->head |= PINUSE_BIT;

        add     edi, ebp
        lea     eax, [edi+ebx+4]        ; address of the next chunk's head
        or      ecx, 3
        mov     [ebp+4], ecx
        or      dword [eax], 1
        lea     eax, [ebp+8]
        add     esp, 8
        pop     edi
        pop     esi
        pop     ebp
        ret

.large:

; v->head = nb|PINUSE_BIT|CINUSE_BIT;
; r->head = rsize|PINUSE_BIT;

        mov     edx, edi
        or      ebx, 3
        mov     [ebp+4], ebx
        or      edx, 1
        mov     [esi+4], edx

; (r+rsize)->prev_foot = rsize;
; insert_chunk(r, rsize);               eax= rsize, ecx= r

        mov     [esi+edi], edi
        mov     eax, edi
        mov     ecx, esi
        call    insert_chunk

        lea     eax, [ebp+8]
        add     esp, 8
        pop     edi
        pop     esi
        pop     ebp
        ret

.done:
; nothing suitable in any tree bin
        add     esp, 8
        pop     edi
        pop     esi
        pop     ebp
        xor     eax, eax
        ret
1021 | 1021 | ||
; init_malloc
;
; Sets up the small heap: obtains a block from kernel_alloc and records it
; as the top chunk, makes every small bin refer to itself, and initialises
; the heap mutex.
;
; param
;  none
;
; modified
;  eax, ecx, flags (plus whatever kernel_alloc and mutex_init modify)
;
; NOTE(review): .reserve_bytes are requested but only .top_bytes are
; recorded as the size of the top chunk - confirm that this is intended.
; NOTE(review): the result of kernel_alloc is used without a check for 0.

init_malloc:

.reserve_bytes  = 0x40000               ; size passed to kernel_alloc
.top_bytes      = 128*1024              ; size recorded for the top chunk
.bins_bytes     = 512                   ; span of mst.smallbins walked below
.bin_step       = 16                    ; distance between two bins

        stdcall kernel_alloc, .reserve_bytes

; the new block becomes the top chunk; bit 0 is set in its head word
; (PINUSE_BIT in the C comments of this file)

        mov     [mst.top], eax
        mov     [mst.topsize], .top_bytes
        mov     dword [eax+4], .top_bytes or 1

; the words at +8 and +12 of every bin get the address of the bin itself
; (presumably the forward/backward links of an empty circular list)

        mov     eax, mst.smallbins

.link_bin:
        mov     [eax+12], eax
        mov     [eax+8], eax
        add     eax, .bin_step
        cmp     eax, mst.smallbins+.bins_bytes
        jb      .link_bin

        mov     ecx, mst.mutex
        call    mutex_init

        ret
1042 | > |
1042 | > |
1043 | > |
1043 | > |
1044 | > |
1044 | > |
1045 | >><>>><>>>><>16) |
1045 | >><>>><>>>><>16) |
1046 | 1046 | ||
1047 | >3; |
1047 | >3; |
1048 | ;><3; |
1048 | ;><3; |
1049 | ;> |
1049 | ;> |