1
0
mirror of https://github.com/vlang/v.git synced 2023-08-10 21:13:21 +03:00

sync: implement pool.work_on_items to process a list of items in parallel

This commit is contained in:
Alexander Medvednikov
2020-03-04 20:28:42 +01:00
committed by GitHub
parent 136aa763a3
commit b0ece3a9d8
7 changed files with 423 additions and 215 deletions

View File

@@ -5,47 +5,26 @@ import net.http
import json
import sync
const (
nr_threads = 4
)
// Story holds the two fields decoded from a Hacker News item's JSON payload.
struct Story {
// story headline
title string
// link to the story
url string
}
// Fetcher is the pre-pool worker state (removed by this commit): a shared
// id list with a mutex-guarded cursor and a waitgroup for completion tracking.
struct Fetcher {
mut:
// guards increments of `cursor` across worker threads
mu &sync.Mutex
// Hacker News story ids to fetch
ids []int
// next index into `ids`; shared between workers
cursor int
// signaled once per fetched story
wg &sync.WaitGroup
}
fn (f mut Fetcher) fetch() {
for {
if f.cursor >= f.ids.len {
return
}
id := f.ids[f.cursor]
f.mu.lock()
f.cursor++
f.mu.unlock()
cursor := f.cursor
resp := http.get('https://hacker-news.firebaseio.com/v0/item/${id}.json') or {
println('failed to fetch data from /v0/item/${id}.json')
exit(1)
}
story := json.decode(Story,resp.text) or {
println('failed to decode a story')
exit(1)
}
println('#$cursor) $story.title | $story.url')
f.wg.done()
// worker_fetch is the sync.PoolProcessor callback: it fetches the Hacker News
// item whose id sits at index `cursor` of the pool's input list, decodes it,
// and prints the title/url. It always returns sync.no_result — the printed
// line is the only output, so the pool collects no per-item results.
fn worker_fetch(p &sync.PoolProcessor, cursor int, worker_id int) voidptr {
id := p.get_item<int>(cursor)
resp := http.get('https://hacker-news.firebaseio.com/v0/item/${id}.json') or {
// network/HTTP failure: report and skip this item
println('failed to fetch data from /v0/item/${id}.json')
return sync.no_result
}
story := json.decode(Story,resp.text) or {
// malformed JSON payload: report and skip this item
println('failed to decode a story')
return sync.no_result
}
println('# $cursor) $story.title | $story.url')
return sync.no_result
}
// Fetches top HN stories in 4 coroutines
// Fetches top HN stories in parallel, depending on how many cores you have
fn main() {
resp := http.get('https://hacker-news.firebaseio.com/v0/topstories.json') or {
println('failed to fetch data from /v0/topstories.json')
@@ -56,22 +35,15 @@ fn main() {
return
}
if ids.len > 10 {
// ids = ids[:10]
mut tmp := [0].repeat(10)
for i in 0..10 {
tmp[i] = ids[i]
}
ids = tmp
ids = ids[0..10]
}
mut fetcher := &Fetcher{
ids: ids
mu: sync.new_mutex()
wg: sync.new_waitgroup()
}
fetcher.wg.add(ids.len)
for i in 0..nr_threads {
go fetcher.fetch()
}
fetcher.wg.wait()
mut fetcher_pool := sync.new_pool_processor({
callback: worker_fetch
})
// NB: if you do not call set_max_jobs, the pool will try to use an optimal
// number of threads, one per each core in your system, which in most
// cases is what you want anyway... You can override the automatic choice
// by setting the VJOBS environment variable too.
// fetcher_pool.set_max_jobs( 4 )
fetcher_pool.work_on_items<int>(ids)
}