about summary refs log tree commit diff
path: root/src/stdio/putc.h
diff options
context:
space:
mode:
author Rich Felker <dalias@aerifal.cx> 2018-10-18 12:47:26 -0400
committer Rich Felker <dalias@aerifal.cx> 2018-10-18 13:09:33 -0400
commit 9dd19122565c70bc6e0fff35724c91a61209a629 (patch)
tree 272f42ab2c781e3663063779ab4a2e338fdd147a /src/stdio/putc.h
parent 7eda27d025d6d52f855588590366c83d737eb727 (diff)
download musl-9dd19122565c70bc6e0fff35724c91a61209a629.tar.gz
musl-9dd19122565c70bc6e0fff35724c91a61209a629.tar.xz
musl-9dd19122565c70bc6e0fff35724c91a61209a629.zip
further optimize getc/putc when locking is needed
check whether the lock is free before loading the calling thread's
tid. if so, just use a dummy tid value that cannot compare equal to
any actual thread id (because it's one bit wider). this also avoids
the need to save the tid and pass it to locking_getc or locking_putc,
reducing register pressure.

this change might slightly hurt the case where the caller already
holds the lock, but it does not affect the single-threaded case, and
may significantly improve the multi-threaded case, especially on archs
where loading the thread pointer is disproportionately expensive like
early mips and arm ISA levels. but even on i386 it helps, at least on
some machines; I measured roughly a 10-15% improvement.
Diffstat (limited to 'src/stdio/putc.h')
-rw-r--r-- src/stdio/putc.h 10
1 files changed, 5 insertions, 5 deletions
diff --git a/src/stdio/putc.h b/src/stdio/putc.h
index a37937e8..2014c4ec 100644
--- a/src/stdio/putc.h
+++ b/src/stdio/putc.h
@@ -4,9 +4,9 @@
 #ifdef __GNUC__
 __attribute__((__noinline__))
 #endif
-static int locking_putc(int c, FILE *f, int tid)
+static int locking_putc(int c, FILE *f)
 {
-	if (a_cas(&f->lock, 0, tid)) __lockfile(f);
+	if (a_cas(&f->lock, 0, MAYBE_WAITERS-1)) __lockfile(f);
 	c = putc_unlocked(c, f);
 	if (a_swap(&f->lock, 0) & MAYBE_WAITERS)
 		__wake(&f->lock, 1, 1);
@@ -15,8 +15,8 @@ static int locking_putc(int c, FILE *f, int tid)
 
 static inline int do_putc(int c, FILE *f)
 {
-	int tid, l = f->lock;
-	if (l < 0 || (l & ~MAYBE_WAITERS) == (tid=__pthread_self()->tid))
+	int l = f->lock;
+	if (l < 0 || l && (l & ~MAYBE_WAITERS) == __pthread_self()->tid)
 		return putc_unlocked(c, f);
-	return locking_putc(c, f, tid);
+	return locking_putc(c, f);
 }