1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright (c) 2023 Meta Platforms, Inc. and affiliates. */
3 
#include <errno.h>
#include <limits.h>
#include <stdlib.h>
#include <sys/types.h>
#include <sys/socket.h>
#include <pthread.h>
#include <argp.h>
8 
9 #include "bench.h"
10 #include "bench_local_storage_create.skel.h"
11 
/*
 * Per-producer scratch arrays.
 *
 * setup() allocates either @fds (socket storage) or @pthds plus
 * @pthd_results (task storage); each array holds batch_sz entries.
 */
struct thread {
	/* Sockets opened during the current batch; -1 marks a failed slot. */
	int *fds;
	/* Threads spawned during the current batch. */
	pthread_t *pthds;
	/* pthread_create() return code for the matching pthds[] slot. */
	int *pthd_results;
};
17 
18 static struct bench_local_storage_create *skel;
19 static struct thread *threads;
20 static long create_owner_errs;
21 static int storage_type = BPF_MAP_TYPE_SK_STORAGE;
22 static int batch_sz = 32;
23 
/* argp keys for the options declared in opts[] and handled by parse_arg(). */
enum {
	ARG_BATCH_SZ = 9000,
	ARG_STORAGE_TYPE,	/* 9001 */
};
28 
29 static const struct argp_option opts[] = {
30 	{ "batch-size", ARG_BATCH_SZ, "BATCH_SIZE", 0,
31 	  "The number of storage creations in each batch" },
32 	{ "storage-type", ARG_STORAGE_TYPE, "STORAGE_TYPE", 0,
33 	  "The type of local storage to test (socket or task)" },
34 	{},
35 };
36 
parse_arg(int key,char * arg,struct argp_state * state)37 static error_t parse_arg(int key, char *arg, struct argp_state *state)
38 {
39 	int ret;
40 
41 	switch (key) {
42 	case ARG_BATCH_SZ:
43 		ret = atoi(arg);
44 		if (ret < 1) {
45 			fprintf(stderr, "invalid batch-size\n");
46 			argp_usage(state);
47 		}
48 		batch_sz = ret;
49 		break;
50 	case ARG_STORAGE_TYPE:
51 		if (!strcmp(arg, "task")) {
52 			storage_type = BPF_MAP_TYPE_TASK_STORAGE;
53 		} else if (!strcmp(arg, "socket")) {
54 			storage_type = BPF_MAP_TYPE_SK_STORAGE;
55 		} else {
56 			fprintf(stderr, "invalid storage-type (socket or task)\n");
57 			argp_usage(state);
58 		}
59 		break;
60 	default:
61 		return ARGP_ERR_UNKNOWN;
62 	}
63 
64 	return 0;
65 }
66 
67 const struct argp bench_local_storage_create_argp = {
68 	.options = opts,
69 	.parser = parse_arg,
70 };
71 
validate(void)72 static void validate(void)
73 {
74 	if (env.consumer_cnt != 0) {
75 		fprintf(stderr,
76 			"local-storage-create benchmark does not need consumer\n");
77 		exit(1);
78 	}
79 }
80 
setup(void)81 static void setup(void)
82 {
83 	int i;
84 
85 	skel = bench_local_storage_create__open_and_load();
86 	if (!skel) {
87 		fprintf(stderr, "error loading skel\n");
88 		exit(1);
89 	}
90 
91 	skel->bss->bench_pid = getpid();
92 	if (storage_type == BPF_MAP_TYPE_SK_STORAGE) {
93 		if (!bpf_program__attach(skel->progs.socket_post_create)) {
94 			fprintf(stderr, "Error attaching bpf program\n");
95 			exit(1);
96 		}
97 	} else {
98 		if (!bpf_program__attach(skel->progs.sched_process_fork)) {
99 			fprintf(stderr, "Error attaching bpf program\n");
100 			exit(1);
101 		}
102 	}
103 
104 	if (!bpf_program__attach(skel->progs.kmalloc)) {
105 		fprintf(stderr, "Error attaching bpf program\n");
106 		exit(1);
107 	}
108 
109 	threads = calloc(env.producer_cnt, sizeof(*threads));
110 
111 	if (!threads) {
112 		fprintf(stderr, "cannot alloc thread_res\n");
113 		exit(1);
114 	}
115 
116 	for (i = 0; i < env.producer_cnt; i++) {
117 		struct thread *t = &threads[i];
118 
119 		if (storage_type == BPF_MAP_TYPE_SK_STORAGE) {
120 			t->fds = malloc(batch_sz * sizeof(*t->fds));
121 			if (!t->fds) {
122 				fprintf(stderr, "cannot alloc t->fds\n");
123 				exit(1);
124 			}
125 		} else {
126 			t->pthds = malloc(batch_sz * sizeof(*t->pthds));
127 			if (!t->pthds) {
128 				fprintf(stderr, "cannot alloc t->pthds\n");
129 				exit(1);
130 			}
131 			t->pthd_results = malloc(batch_sz * sizeof(*t->pthd_results));
132 			if (!t->pthd_results) {
133 				fprintf(stderr, "cannot alloc t->pthd_results\n");
134 				exit(1);
135 			}
136 		}
137 	}
138 }
139 
measure(struct bench_res * res)140 static void measure(struct bench_res *res)
141 {
142 	res->hits = atomic_swap(&skel->bss->create_cnts, 0);
143 	res->drops = atomic_swap(&skel->bss->kmalloc_cnts, 0);
144 }
145 
sk_producer(void * input)146 static void *sk_producer(void *input)
147 {
148 	struct thread *t = &threads[(long)(input)];
149 	int *fds = t->fds;
150 	int i;
151 
152 	while (true) {
153 		for (i = 0; i < batch_sz; i++) {
154 			fds[i] = socket(AF_INET6, SOCK_DGRAM, 0);
155 			if (fds[i] == -1)
156 				atomic_inc(&create_owner_errs);
157 		}
158 
159 		for (i = 0; i < batch_sz; i++) {
160 			if (fds[i] != -1)
161 				close(fds[i]);
162 		}
163 	}
164 
165 	return NULL;
166 }
167 
/* Start routine for the threads spawned by task_producer(); does no work. */
static void *thread_func(void *arg)
{
	(void)arg;

	return NULL;
}
172 
task_producer(void * input)173 static void *task_producer(void *input)
174 {
175 	struct thread *t = &threads[(long)(input)];
176 	pthread_t *pthds = t->pthds;
177 	int *pthd_results = t->pthd_results;
178 	int i;
179 
180 	while (true) {
181 		for (i = 0; i < batch_sz; i++) {
182 			pthd_results[i] = pthread_create(&pthds[i], NULL, thread_func, NULL);
183 			if (pthd_results[i])
184 				atomic_inc(&create_owner_errs);
185 		}
186 
187 		for (i = 0; i < batch_sz; i++) {
188 			if (!pthd_results[i])
189 				pthread_join(pthds[i], NULL);
190 		}
191 	}
192 
193 	return NULL;
194 }
195 
producer(void * input)196 static void *producer(void *input)
197 {
198 	if (storage_type == BPF_MAP_TYPE_SK_STORAGE)
199 		return sk_producer(input);
200 	else
201 		return task_producer(input);
202 }
203 
report_progress(int iter,struct bench_res * res,long delta_ns)204 static void report_progress(int iter, struct bench_res *res, long delta_ns)
205 {
206 	double creates_per_sec, kmallocs_per_create;
207 
208 	creates_per_sec = res->hits / 1000.0 / (delta_ns / 1000000000.0);
209 	kmallocs_per_create = (double)res->drops / res->hits;
210 
211 	printf("Iter %3d (%7.3lfus): ",
212 	       iter, (delta_ns - 1000000000) / 1000.0);
213 	printf("creates %8.3lfk/s (%7.3lfk/prod), ",
214 	       creates_per_sec, creates_per_sec / env.producer_cnt);
215 	printf("%3.2lf kmallocs/create\n", kmallocs_per_create);
216 }
217 
report_final(struct bench_res res[],int res_cnt)218 static void report_final(struct bench_res res[], int res_cnt)
219 {
220 	double creates_mean = 0.0, creates_stddev = 0.0;
221 	long total_creates = 0, total_kmallocs = 0;
222 	int i;
223 
224 	for (i = 0; i < res_cnt; i++) {
225 		creates_mean += res[i].hits / 1000.0 / (0.0 + res_cnt);
226 		total_creates += res[i].hits;
227 		total_kmallocs += res[i].drops;
228 	}
229 
230 	if (res_cnt > 1)  {
231 		for (i = 0; i < res_cnt; i++)
232 			creates_stddev += (creates_mean - res[i].hits / 1000.0) *
233 				       (creates_mean - res[i].hits / 1000.0) /
234 				       (res_cnt - 1.0);
235 		creates_stddev = sqrt(creates_stddev);
236 	}
237 	printf("Summary: creates %8.3lf \u00B1 %5.3lfk/s (%7.3lfk/prod), ",
238 	       creates_mean, creates_stddev, creates_mean / env.producer_cnt);
239 	printf("%4.2lf kmallocs/create\n", (double)total_kmallocs / total_creates);
240 	if (create_owner_errs || skel->bss->create_errs)
241 		printf("%s() errors %ld create_errs %ld\n",
242 		       storage_type == BPF_MAP_TYPE_SK_STORAGE ?
243 		       "socket" : "pthread_create",
244 		       create_owner_errs,
245 		       skel->bss->create_errs);
246 }
247 
248 /* Benchmark performance of creating bpf local storage  */
249 const struct bench bench_local_storage_create = {
250 	.name = "local-storage-create",
251 	.argp = &bench_local_storage_create_argp,
252 	.validate = validate,
253 	.setup = setup,
254 	.producer_thread = producer,
255 	.measure = measure,
256 	.report_progress = report_progress,
257 	.report_final = report_final,
258 };
259