mirror of
https://github.com/golang/go
synced 2024-11-18 15:04:44 -07:00
runtime: make cas64 like cas32 and casp
The current cas64 definition hard-codes the x86 behavior of updating *old with the new value when the cas fails. This is inconsistent with cas32 and casp. Make it consistent. This means that the cas64 uses will be epsilon less efficient than they might be, because they have to do an unnecessary memory load on x86. But so be it. Code clarity and consistency is more important. R=golang-dev, bradfitz CC=golang-dev https://golang.org/cl/10909045
This commit is contained in:
parent
3a8845b525
commit
fb63e4fefb
@ -374,13 +374,11 @@ TEXT runtime·cas(SB), 7, $0
|
|||||||
// *val = new;
|
// *val = new;
|
||||||
// return 1;
|
// return 1;
|
||||||
// } else {
|
// } else {
|
||||||
// *old = *val
|
|
||||||
// return 0;
|
// return 0;
|
||||||
// }
|
// }
|
||||||
TEXT runtime·cas64(SB), 7, $0
|
TEXT runtime·cas64(SB), 7, $0
|
||||||
MOVQ 8(SP), BX
|
MOVQ 8(SP), BX
|
||||||
MOVQ 16(SP), BP
|
MOVQ 16(SP), AX
|
||||||
MOVQ 0(BP), AX
|
|
||||||
MOVQ 24(SP), CX
|
MOVQ 24(SP), CX
|
||||||
LOCK
|
LOCK
|
||||||
CMPXCHGQ CX, 0(BX)
|
CMPXCHGQ CX, 0(BX)
|
||||||
@ -388,7 +386,6 @@ TEXT runtime·cas64(SB), 7, $0
|
|||||||
MOVL $1, AX
|
MOVL $1, AX
|
||||||
RET
|
RET
|
||||||
cas64_fail:
|
cas64_fail:
|
||||||
MOVQ AX, 0(BP)
|
|
||||||
MOVL $0, AX
|
MOVL $0, AX
|
||||||
RET
|
RET
|
||||||
|
|
||||||
|
@ -24,10 +24,10 @@ runtime·xadd64(uint64 volatile* addr, int64 v)
|
|||||||
{
|
{
|
||||||
uint64 old;
|
uint64 old;
|
||||||
|
|
||||||
old = *addr;
|
do
|
||||||
while(!runtime·cas64(addr, &old, old+v)) {
|
old = *addr;
|
||||||
// nothing
|
while(!runtime·cas64(addr, old, old+v));
|
||||||
}
|
|
||||||
return old+v;
|
return old+v;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -37,9 +37,9 @@ runtime·xchg64(uint64 volatile* addr, uint64 v)
|
|||||||
{
|
{
|
||||||
uint64 old;
|
uint64 old;
|
||||||
|
|
||||||
old = *addr;
|
do
|
||||||
while(!runtime·cas64(addr, &old, v)) {
|
old = addr;
|
||||||
// nothing
|
while(!runtime·cas64(addr, old, v));
|
||||||
}
|
|
||||||
return old;
|
return old;
|
||||||
}
|
}
|
||||||
|
@ -92,16 +92,15 @@ runtime·atomicstore(uint32 volatile* addr, uint32 v)
|
|||||||
|
|
||||||
#pragma textflag 7
|
#pragma textflag 7
|
||||||
bool
|
bool
|
||||||
runtime·cas64(uint64 volatile *addr, uint64 *old, uint64 new)
|
runtime·cas64(uint64 volatile *addr, uint64 old, uint64 new)
|
||||||
{
|
{
|
||||||
bool res;
|
bool res;
|
||||||
|
|
||||||
runtime·lock(LOCK(addr));
|
runtime·lock(LOCK(addr));
|
||||||
if(*addr == *old) {
|
if(*addr == old) {
|
||||||
*addr = new;
|
*addr = new;
|
||||||
res = true;
|
res = true;
|
||||||
} else {
|
} else {
|
||||||
*old = *addr;
|
|
||||||
res = false;
|
res = false;
|
||||||
}
|
}
|
||||||
runtime·unlock(LOCK(addr));
|
runtime·unlock(LOCK(addr));
|
||||||
|
@ -29,10 +29,10 @@ runtime·lfstackpush(uint64 *head, LFNode *node)
|
|||||||
|
|
||||||
node->pushcnt++;
|
node->pushcnt++;
|
||||||
new = (uint64)(uintptr)node|(((uint64)node->pushcnt&CNT_MASK)<<PTR_BITS);
|
new = (uint64)(uintptr)node|(((uint64)node->pushcnt&CNT_MASK)<<PTR_BITS);
|
||||||
old = runtime·atomicload64(head);
|
|
||||||
for(;;) {
|
for(;;) {
|
||||||
|
old = runtime·atomicload64(head);
|
||||||
node->next = (LFNode*)(uintptr)(old&PTR_MASK);
|
node->next = (LFNode*)(uintptr)(old&PTR_MASK);
|
||||||
if(runtime·cas64(head, &old, new))
|
if(runtime·cas64(head, old, new))
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -43,8 +43,8 @@ runtime·lfstackpop(uint64 *head)
|
|||||||
LFNode *node, *node2;
|
LFNode *node, *node2;
|
||||||
uint64 old, new;
|
uint64 old, new;
|
||||||
|
|
||||||
old = runtime·atomicload64(head);
|
|
||||||
for(;;) {
|
for(;;) {
|
||||||
|
old = runtime·atomicload64(head);
|
||||||
if(old == 0)
|
if(old == 0)
|
||||||
return nil;
|
return nil;
|
||||||
node = (LFNode*)(uintptr)(old&PTR_MASK);
|
node = (LFNode*)(uintptr)(old&PTR_MASK);
|
||||||
@ -52,7 +52,7 @@ runtime·lfstackpop(uint64 *head)
|
|||||||
new = 0;
|
new = 0;
|
||||||
if(node2 != nil)
|
if(node2 != nil)
|
||||||
new = (uint64)(uintptr)node2|(((uint64)node2->pushcnt&CNT_MASK)<<PTR_BITS);
|
new = (uint64)(uintptr)node2|(((uint64)node2->pushcnt&CNT_MASK)<<PTR_BITS);
|
||||||
if(runtime·cas64(head, &old, new))
|
if(runtime·cas64(head, old, new))
|
||||||
return node;
|
return node;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -144,9 +144,9 @@ runtime·parfordo(ParFor *desc)
|
|||||||
if(victim >= tid)
|
if(victim >= tid)
|
||||||
victim++;
|
victim++;
|
||||||
victimpos = &desc->thr[victim].pos;
|
victimpos = &desc->thr[victim].pos;
|
||||||
pos = runtime·atomicload64(victimpos);
|
|
||||||
for(;;) {
|
for(;;) {
|
||||||
// See if it has any work.
|
// See if it has any work.
|
||||||
|
pos = runtime·atomicload64(victimpos);
|
||||||
begin = (uint32)pos;
|
begin = (uint32)pos;
|
||||||
end = (uint32)(pos>>32);
|
end = (uint32)(pos>>32);
|
||||||
if(begin+1 >= end) {
|
if(begin+1 >= end) {
|
||||||
@ -159,7 +159,7 @@ runtime·parfordo(ParFor *desc)
|
|||||||
}
|
}
|
||||||
begin2 = begin + (end-begin)/2;
|
begin2 = begin + (end-begin)/2;
|
||||||
newpos = (uint64)begin | (uint64)begin2<<32;
|
newpos = (uint64)begin | (uint64)begin2<<32;
|
||||||
if(runtime·cas64(victimpos, &pos, newpos)) {
|
if(runtime·cas64(victimpos, pos, newpos)) {
|
||||||
begin = begin2;
|
begin = begin2;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
@ -157,11 +157,12 @@ TestAtomic64(void)
|
|||||||
z64 = 42;
|
z64 = 42;
|
||||||
x64 = 0;
|
x64 = 0;
|
||||||
PREFETCH(&z64);
|
PREFETCH(&z64);
|
||||||
if(runtime·cas64(&z64, &x64, 1))
|
if(runtime·cas64(&z64, x64, 1))
|
||||||
runtime·throw("cas64 failed");
|
runtime·throw("cas64 failed");
|
||||||
if(x64 != 42)
|
if(x64 != 0)
|
||||||
runtime·throw("cas64 failed");
|
runtime·throw("cas64 failed");
|
||||||
if(!runtime·cas64(&z64, &x64, 1))
|
x64 = 42;
|
||||||
|
if(!runtime·cas64(&z64, x64, 1))
|
||||||
runtime·throw("cas64 failed");
|
runtime·throw("cas64 failed");
|
||||||
if(x64 != 42 || z64 != 1)
|
if(x64 != 42 || z64 != 1)
|
||||||
runtime·throw("cas64 failed");
|
runtime·throw("cas64 failed");
|
||||||
@ -193,7 +194,7 @@ runtime·check(void)
|
|||||||
uint64 h;
|
uint64 h;
|
||||||
float32 i, i1;
|
float32 i, i1;
|
||||||
float64 j, j1;
|
float64 j, j1;
|
||||||
void* k;
|
byte *k, *k1;
|
||||||
uint16* l;
|
uint16* l;
|
||||||
struct x1 {
|
struct x1 {
|
||||||
byte x;
|
byte x;
|
||||||
@ -232,6 +233,17 @@ runtime·check(void)
|
|||||||
if(z != 4)
|
if(z != 4)
|
||||||
runtime·throw("cas4");
|
runtime·throw("cas4");
|
||||||
|
|
||||||
|
k = (byte*)0xfedcb123;
|
||||||
|
if(sizeof(void*) == 8)
|
||||||
|
k = (byte*)((uintptr)k<<10);
|
||||||
|
if(runtime·casp((void**)&k, nil, nil))
|
||||||
|
runtime·throw("casp1");
|
||||||
|
k1 = k+1;
|
||||||
|
if(!runtime·casp((void**)&k, k, k1))
|
||||||
|
runtime·throw("casp2");
|
||||||
|
if(k != k1)
|
||||||
|
runtime·throw("casp3");
|
||||||
|
|
||||||
*(uint64*)&j = ~0ULL;
|
*(uint64*)&j = ~0ULL;
|
||||||
if(j == j)
|
if(j == j)
|
||||||
runtime·throw("float64nan");
|
runtime·throw("float64nan");
|
||||||
|
@ -761,7 +761,7 @@ int32 runtime·write(int32, void*, int32);
|
|||||||
int32 runtime·close(int32);
|
int32 runtime·close(int32);
|
||||||
int32 runtime·mincore(void*, uintptr, byte*);
|
int32 runtime·mincore(void*, uintptr, byte*);
|
||||||
bool runtime·cas(uint32*, uint32, uint32);
|
bool runtime·cas(uint32*, uint32, uint32);
|
||||||
bool runtime·cas64(uint64*, uint64*, uint64);
|
bool runtime·cas64(uint64*, uint64, uint64);
|
||||||
bool runtime·casp(void**, void*, void*);
|
bool runtime·casp(void**, void*, void*);
|
||||||
// Don't confuse with XADD x86 instruction,
|
// Don't confuse with XADD x86 instruction,
|
||||||
// this one is actually 'addx', that is, add-and-fetch.
|
// this one is actually 'addx', that is, add-and-fetch.
|
||||||
|
Loading…
Reference in New Issue
Block a user