Using atomic instead of mutex and delete scratch slice #1833

Merged
merged 13 commits into valyala:master on Aug 25, 2024

Conversation

NikoMalik
Contributor

No description provided.

@newacorn
Contributor

Whether using an array with a lock or a linked list with atomic operations to manage the workerChan resources, the subsequent operations on workerChan are I/O-intensive. Given that the operations are FILO and each element involves significant I/O, I don't think a linked list has any particular advantage.
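For readers following along, here is a minimal sketch of the two shapes being compared: a mutex-guarded slice used as a LIFO ("FILO") stack, and a lock-free linked list (a Treiber stack) built on atomic.Pointer. All names and fields below are illustrative assumptions, not fasthttp's actual code.

package workerpool

import (
	"sync"
	"sync/atomic"
)

// Simplified stand-in for fasthttp's workerChan.
type workerChan struct {
	next atomic.Pointer[workerChan] // only used by the lock-free variant
	ch   chan struct{}
}

// Variant 1: mutex-guarded slice used as a LIFO stack.
type sliceStack struct {
	mu    sync.Mutex
	ready []*workerChan
}

func (s *sliceStack) push(wc *workerChan) {
	s.mu.Lock()
	s.ready = append(s.ready, wc)
	s.mu.Unlock()
}

func (s *sliceStack) pop() *workerChan {
	s.mu.Lock()
	defer s.mu.Unlock()
	n := len(s.ready)
	if n == 0 {
		return nil
	}
	wc := s.ready[n-1]
	s.ready[n-1] = nil // drop the reference so the GC can reclaim it
	s.ready = s.ready[:n-1]
	return wc
}

// Variant 2: lock-free linked list (Treiber stack) using CAS loops.
type nodeStack struct {
	head atomic.Pointer[workerChan]
}

func (s *nodeStack) push(wc *workerChan) {
	for {
		top := s.head.Load()
		wc.next.Store(top)
		if s.head.CompareAndSwap(top, wc) {
			return
		}
	}
}

func (s *nodeStack) pop() *workerChan {
	for {
		top := s.head.Load()
		if top == nil {
			return nil
		}
		// Real implementations need care around node reuse (ABA);
		// this only shows the overall shape of the approach.
		if s.head.CompareAndSwap(top, top.next.Load()) {
			return top
		}
	}
}

Either way, the per-element work (the connection I/O handled through each workerChan) dwarfs the cost of the push/pop itself, which is the point being made here.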

@NikoMalik
Contributor Author

Whether using an array with a lock or a linked list with atomic operations to manage the workerChan resources, the subsequent operations on workerChan are I/O-intensive. Given that the operations are FILO and each element involves significant I/O, I don't think a linked list has any particular advantage.

I got a speedup of almost 1.5x in the benchmark tests.

@erikdubbelboer
Collaborator

Can you show which benchmarks you used and their results here?

@NikoMalik
Contributor Author

func BenchmarkWorkerPoolStartStopSerial(b *testing.B) {
	for i := 0; i < b.N; i++ {
		testWorkerPoolStartStopBENCH()
	}
}

func BenchmarkWorkerPoolStartStopConcurrent(b *testing.B) {
	concurrency := 10
	ch := make(chan struct{}, concurrency)
	b.ResetTimer()
	for i := 0; i < b.N; i++ {
		for j := 0; j < concurrency; j++ {
			go func() {
				testWorkerPoolStartStopBENCH()
				ch <- struct{}{}
			}()
		}
		for j := 0; j < concurrency; j++ {
			select {
			case <-ch:
			case <-time.After(time.Second):
				b.Fatalf("timeout")
			}
		}
	}
}

func BenchmarkWorkerPoolMaxWorkersCountSerial(b *testing.B) {
	for i := 0; i < b.N; i++ {
		testWorkerPoolMaxWorkersCountMultiBENCH(b)
	}
}

func BenchmarkWorkerPoolMaxWorkersCountConcurrent(b *testing.B) {
	concurrency := 4
	ch := make(chan struct{}, concurrency)
	b.ResetTimer()
	for i := 0; i < b.N; i++ {
		for j := 0; j < concurrency; j++ {
			go func() {
				testWorkerPoolMaxWorkersCountMultiBENCH(b)
				ch <- struct{}{}
			}()
		}
		for j := 0; j < concurrency; j++ {
			select {
			case <-ch:
			case <-time.After(time.Second * 2):
				b.Fatalf("timeout")
			}
		}
	}
}

func testWorkerPoolStartStopBENCH() {
	wp := &workerPool{
		WorkerFunc:      func(conn net.Conn) error { return nil },
		MaxWorkersCount: 10,
		Logger:          defaultLogger,
	}
	for i := 0; i < 10; i++ {
		wp.Start()
		wp.Stop()
	}
}

func testWorkerPoolMaxWorkersCountMultiBENCH(b *testing.B) {
	for i := 0; i < 5; i++ {
		testWorkerPoolMaxWorkersCountBENCH(b)
	}
}

func testWorkerPoolMaxWorkersCountBENCH(b *testing.B) {
	ready := make(chan struct{})
	wp := &workerPool{
		WorkerFunc: func(conn net.Conn) error {
			buf := make([]byte, 100)
			n, err := conn.Read(buf)
			if err != nil {
				b.Errorf("unexpected error: %v", err)
			}
			buf = buf[:n]
			if string(buf) != "foobar" {
				b.Errorf("unexpected data read: %q. Expecting %q", buf, "foobar")
			}
			if _, err = conn.Write([]byte("baz")); err != nil {
				b.Errorf("unexpected error: %v", err)
			}

			<-ready

			return nil
		},
		MaxWorkersCount: 10,
		Logger:          defaultLogger,
		connState:       func(net.Conn, ConnState) {},
	}
	wp.Start()

	ln := fasthttputil.NewInmemoryListener()

	clientCh := make(chan struct{}, wp.MaxWorkersCount)
	for i := 0; i < wp.MaxWorkersCount; i++ {
		go func() {
			conn, err := ln.Dial()
			if err != nil {
				b.Errorf("unexpected error: %v", err)
			}
			if _, err = conn.Write([]byte("foobar")); err != nil {
				b.Errorf("unexpected error: %v", err)
			}
			data, err := io.ReadAll(conn)
			if err != nil {
				b.Errorf("unexpected error: %v", err)
			}
			if string(data) != "baz" {
				b.Errorf("unexpected value read: %q. Expecting %q", data, "baz")
			}
			if err = conn.Close(); err != nil {
				b.Errorf("unexpected error: %v", err)
			}
			clientCh <- struct{}{}
		}()
	}

	for i := 0; i < wp.MaxWorkersCount; i++ {
		conn, err := ln.Accept()
		if err != nil {
			b.Fatalf("unexpected error: %v", err)
		}
		if !wp.Serve(conn) {
			b.Fatalf("worker pool must have enough workers to serve the conn")
		}
	}

	go func() {
		if _, err := ln.Dial(); err != nil {
			b.Errorf("unexpected error: %v", err)
		}
	}()
	conn, err := ln.Accept()
	if err != nil {
		b.Fatalf("unexpected error: %v", err)
	}
	for i := 0; i < 5; i++ {
		if wp.Serve(conn) {
			b.Fatalf("worker pool must be full")
		}
	}
	if err = conn.Close(); err != nil {
		b.Fatalf("unexpected error: %v", err)
	}

	close(ready)

	for i := 0; i < wp.MaxWorkersCount; i++ {
		select {
		case <-clientCh:
		case <-time.After(time.Second):
			b.Fatalf("timeout")
		}
	}

	if err := ln.Close(); err != nil {
		b.Fatalf("unexpected error: %v", err)
	}
	wp.Stop()
}

I used these benchmarks, based on the existing tests.

Results using atomic:

goarch: amd64
pkg: github.com/valyala/fasthttp
cpu: 11th Gen Intel(R) Core(TM) i5-11400F @ 2.60GHz
=== RUN   BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial-12
  216567              5454 ns/op            1494 B/op         21 allocs/op
=== RUN   BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent-12
   35728             31353 ns/op           17913 B/op        250 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial-12
    2488            523983 ns/op          253846 B/op       1143 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent-12
    1339            811728 ns/op         1019013 B/op       4624 allocs/op
PASS
ok      github.com/valyala/fasthttp     5.554s

Results using mutex and slice:

goarch: amd64
pkg: github.com/valyala/fasthttp
cpu: 11th Gen Intel(R) Core(TM) i5-11400F @ 2.60GHz
=== RUN   BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial-12
  211056              5594 ns/op            1508 B/op         21 allocs/op
=== RUN   BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent-12
   35869             32778 ns/op           18003 B/op        250 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial-12
    2433            537527 ns/op          256182 B/op       1093 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent-12
    1458            876898 ns/op         1027666 B/op       4420 allocs/op
PASS
ok      github.com/valyala/fasthttp     5.788s

@erikdubbelboer
Collaborator

Any idea what is causing the extra allocations?

This option immediately exits the loop when the maximum number of workers is reached, rather than creating a new worker once the limit is hit. This reduces the frequency of unnecessary operations and potential lock contention in sync.Pool.

@NikoMalik
Contributor Author

NikoMalik commented Aug 22, 2024

Any idea what is causing the extra allocations?

I fixed it:

cpu: 11th Gen Intel(R) Core(TM) i5-11400F @ 2.60GHz
=== RUN   BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial
BenchmarkWorkerPoolStartStopSerial-12
  205198              5466 ns/op            1494 B/op         21 allocs/op
=== RUN   BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent
BenchmarkWorkerPoolStartStopConcurrent-12
   34980             30404 ns/op           17959 B/op        250 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial
BenchmarkWorkerPoolMaxWorkersCountSerial-12
    2520            509416 ns/op          251338 B/op       1050 allocs/op
=== RUN   BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent
BenchmarkWorkerPoolMaxWorkersCountConcurrent-12
    1652            782699 ns/op         1008180 B/op       4218 allocs/op
PASS
ok      github.com/valyala/fasthttp     5.588s 

The problem was in getCh().
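A rough, hedged sketch of the control flow the commit note above describes, continuing the earlier sketch's file and reusing its hypothetical nodeStack/workerChan types (these names are my own guesses, not the PR's actual code): the key change is returning early once the worker limit is reached, before the sync.Pool is touched at all.

// Hypothetical getCh: bail out as soon as the worker limit is hit,
// so a full pool costs neither a sync.Pool round-trip nor an allocation.
type pool struct {
	maxWorkersCount int32
	workersCount    atomic.Int32
	ready           nodeStack // lock-free stack of idle workers
	workerChanPool  sync.Pool // caches *workerChan values
}

func (p *pool) getCh() *workerChan {
	// Fast path: reuse an idle worker.
	if wc := p.ready.pop(); wc != nil {
		return wc
	}
	// Reserve a slot, or return nil immediately if the pool is full.
	for {
		n := p.workersCount.Load()
		if n >= p.maxWorkersCount {
			return nil // caller rejects the connection
		}
		if p.workersCount.CompareAndSwap(n, n+1) {
			break
		}
	}
	// Only a successfully reserved slot pays for a (possibly pooled) workerChan.
	if v := p.workerChanPool.Get(); v != nil {
		return v.(*workerChan)
	}
	return &workerChan{ch: make(chan struct{}, 1)}
}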

@erikdubbelboer
Collaborator

Our linter would like to see some changes.

NikoMalik and others added 4 commits August 24, 2024 10:26
Co-authored-by: Erik Dubbelboer <erik@dubbelboer.com>
Co-authored-by: Erik Dubbelboer <erik@dubbelboer.com>
Co-authored-by: Erik Dubbelboer <erik@dubbelboer.com>
@erikdubbelboer
Collaborator

Seems like the code isn't completely thread safe, 3 tests failed with the race detector.

@NikoMalik
Contributor Author

Seems like the code isn't completely thread safe, 3 tests failed with the race detector.

I believe I've ruled out the last of the possible data races.
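For what it's worth, the usual way to shake such issues out is a small stress test run under the race detector (go test -race). A sketch, again reusing the hypothetical nodeStack and workerChan types from the earlier example, and assuming the standard sync and testing imports:

// Stress test: several goroutines push and pop concurrently.
// Run with: go test -race
func TestNodeStackConcurrent(t *testing.T) {
	var s nodeStack
	var wg sync.WaitGroup
	for g := 0; g < 8; g++ {
		wg.Add(1)
		go func() {
			defer wg.Done()
			for i := 0; i < 10000; i++ {
				wc := s.pop()
				if wc == nil {
					wc = &workerChan{ch: make(chan struct{}, 1)}
				}
				s.push(wc)
			}
		}()
	}
	wg.Wait()
}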

@erikdubbelboer erikdubbelboer merged commit 19c50cd into valyala:master Aug 25, 2024
15 checks passed
@erikdubbelboer
Collaborator

Thanks!

newacorn added a commit to newacorn/fasthttp that referenced this pull request Aug 26, 2024
newacorn added a commit to newacorn/fasthttp that referenced this pull request Sep 7, 2024
erikdubbelboer pushed a commit that referenced this pull request Sep 10, 2024
* Remove a redundant field and clarify the comments.

* Revert "Using atomic instead of mutex and delete scratch slice (#1833)"

This reverts commit 19c50cd.