[FFmpeg-devel] [PATCH] Stop using _explicit atomic operations where not necessary.
James Almer
jamrial at gmail.com
Sat Jun 5 17:46:01 EEST 2021
On 6/5/2021 11:27 AM, Anton Khirnov wrote:
> Memory ordering constraints other than the default (sequentially
> consistent) can behave in very unintuitive and unexpected ways, and so
> should be avoided unless there is a strong (typically performance)
> reason for using them. This holds especially for memory_order_relaxed,
> which imposes no ordering constraints.
Performance is important for FIFO, though. Could they use a laxer order
at least for the fetch_sub and fetch_add cases?
Also, commit fed50c4304e, which made cpu_flags an atomic type, states
that ThreadSanitizer stopped reporting races on tests/cpu_init after
that change, so maybe memory order is not important for it, only atomicity.
In any case these cpu and mem functions are hardly a bottleneck
anywhere, and rarely called outside of debugging, so this change is ok.
> ---
> libavformat/fifo.c | 8 ++++----
> libavutil/cpu.c | 8 ++++----
> libavutil/mem.c | 10 +++++-----
> 3 files changed, 13 insertions(+), 13 deletions(-)
>
> diff --git a/libavformat/fifo.c b/libavformat/fifo.c
> index 50656f78b7..2ac14207b8 100644
> --- a/libavformat/fifo.c
> +++ b/libavformat/fifo.c
> @@ -185,7 +185,7 @@ static int fifo_thread_write_packet(FifoThreadContext *ctx, AVPacket *pkt)
> int ret, s_idx;
>
> if (fifo->timeshift && pkt->dts != AV_NOPTS_VALUE)
> - atomic_fetch_sub_explicit(&fifo->queue_duration, next_duration(avf, pkt, &ctx->last_received_dts), memory_order_relaxed);
> + atomic_fetch_sub(&fifo->queue_duration, next_duration(avf, pkt, &ctx->last_received_dts));
>
> if (ctx->drop_until_keyframe) {
> if (pkt->flags & AV_PKT_FLAG_KEY) {
> @@ -454,7 +454,7 @@ static void *fifo_consumer_thread(void *data)
> av_log(avf, AV_LOG_INFO, "FIFO queue flushed\n");
>
> if (fifo->timeshift)
> - while (atomic_load_explicit(&fifo->queue_duration, memory_order_relaxed) < fifo->timeshift)
> + while (atomic_load(&fifo->queue_duration) < fifo->timeshift)
> av_usleep(10000);
>
> ret = av_thread_message_queue_recv(queue, &msg, 0);
> @@ -594,7 +594,7 @@ static int fifo_write_packet(AVFormatContext *avf, AVPacket *pkt)
> }
>
> if (fifo->timeshift && pkt && pkt->dts != AV_NOPTS_VALUE)
> - atomic_fetch_add_explicit(&fifo->queue_duration, next_duration(avf, pkt, &fifo->last_sent_dts), memory_order_relaxed);
> + atomic_fetch_add(&fifo->queue_duration, next_duration(avf, pkt, &fifo->last_sent_dts));
>
> return ret;
> fail:
> @@ -621,7 +621,7 @@ static int fifo_write_trailer(AVFormatContext *avf)
> } else {
> now += delay;
> }
> - atomic_fetch_add_explicit(&fifo->queue_duration, delay, memory_order_relaxed);
> + atomic_fetch_add(&fifo->queue_duration, delay);
> elapsed += delay;
> if (elapsed > fifo->timeshift)
> break;
> diff --git a/libavutil/cpu.c b/libavutil/cpu.c
> index 8960415d00..8a6af81ae4 100644
> --- a/libavutil/cpu.c
> +++ b/libavutil/cpu.c
> @@ -89,15 +89,15 @@ void av_force_cpu_flags(int arg){
> arg |= AV_CPU_FLAG_MMX;
> }
>
> - atomic_store_explicit(&cpu_flags, arg, memory_order_relaxed);
> + atomic_store(&cpu_flags, arg);
> }
>
> int av_get_cpu_flags(void)
> {
> - int flags = atomic_load_explicit(&cpu_flags, memory_order_relaxed);
> + int flags = atomic_load(&cpu_flags);
> if (flags == -1) {
> flags = get_cpu_flags();
> - atomic_store_explicit(&cpu_flags, flags, memory_order_relaxed);
> + atomic_store(&cpu_flags, flags);
> }
> return flags;
> }
> @@ -221,7 +221,7 @@ int av_cpu_count(void)
> nb_cpus = sysinfo.dwNumberOfProcessors;
> #endif
>
> - if (!atomic_exchange_explicit(&printed, 1, memory_order_relaxed))
> + if (!atomic_exchange(&printed, 1))
> av_log(NULL, AV_LOG_DEBUG, "detected %d logical cores\n", nb_cpus);
>
> return nb_cpus;
> diff --git a/libavutil/mem.c b/libavutil/mem.c
> index a52d33d4a6..c216c0314f 100644
> --- a/libavutil/mem.c
> +++ b/libavutil/mem.c
> @@ -72,14 +72,14 @@ void free(void *ptr);
> static atomic_size_t max_alloc_size = ATOMIC_VAR_INIT(INT_MAX);
>
> void av_max_alloc(size_t max){
> - atomic_store_explicit(&max_alloc_size, max, memory_order_relaxed);
> + atomic_store(&max_alloc_size, max);
> }
>
> void *av_malloc(size_t size)
> {
> void *ptr = NULL;
>
> - if (size > atomic_load_explicit(&max_alloc_size, memory_order_relaxed))
> + if (size > atomic_load(&max_alloc_size))
> return NULL;
>
> #if HAVE_POSIX_MEMALIGN
> @@ -135,7 +135,7 @@ void *av_malloc(size_t size)
> void *av_realloc(void *ptr, size_t size)
> {
> void *ret;
> - if (size > atomic_load_explicit(&max_alloc_size, memory_order_relaxed))
> + if (size > atomic_load(&max_alloc_size))
> return NULL;
>
> #if HAVE_ALIGNED_MALLOC
> @@ -489,7 +489,7 @@ void *av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
> if (min_size <= *size)
> return ptr;
>
> - max_size = atomic_load_explicit(&max_alloc_size, memory_order_relaxed);
> + max_size = atomic_load(&max_alloc_size);
>
> if (min_size > max_size) {
> *size = 0;
> @@ -521,7 +521,7 @@ static inline void fast_malloc(void *ptr, unsigned int *size, size_t min_size, i
> return;
> }
>
> - max_size = atomic_load_explicit(&max_alloc_size, memory_order_relaxed);
> + max_size = atomic_load(&max_alloc_size);
>
> if (min_size > max_size) {
> av_freep(ptr);
>
More information about the ffmpeg-devel
mailing list