1 // SPDX-License-Identifier: GPL-2.0
2 #include <string.h>
3 #include <netinet/in.h>
4 #include <netinet/tcp.h>
5 #include <linux/bpf.h>
6 #include <bpf/bpf_helpers.h>
7 
8 char _license[] SEC("license") = "GPL";
9 __u32 _version SEC("version") = 1;
10 
/* Fallback used only when no earlier header has defined PAGE_SIZE. */
#if !defined(PAGE_SIZE)
#define PAGE_SIZE 4096
#endif

/* Socket option level that the programs below handle themselves. */
#define SOL_CUSTOM			0xdeadbeef
16 
17 struct sockopt_sk {
18 	__u8 val;
19 };
20 
21 struct {
22 	__uint(type, BPF_MAP_TYPE_SK_STORAGE);
23 	__uint(map_flags, BPF_F_NO_PREALLOC);
24 	__type(key, int);
25 	__type(value, struct sockopt_sk);
26 } socket_storage_map SEC(".maps");
27 
28 SEC("cgroup/getsockopt")
_getsockopt(struct bpf_sockopt * ctx)29 int _getsockopt(struct bpf_sockopt *ctx)
30 {
31 	__u8 *optval_end = ctx->optval_end;
32 	__u8 *optval = ctx->optval;
33 	struct sockopt_sk *storage;
34 
35 	if (ctx->level == SOL_IP && ctx->optname == IP_TOS) {
36 		/* Not interested in SOL_IP:IP_TOS;
37 		 * let next BPF program in the cgroup chain or kernel
38 		 * handle it.
39 		 */
40 		ctx->optlen = 0; /* bypass optval>PAGE_SIZE */
41 		return 1;
42 	}
43 
44 	if (ctx->level == SOL_SOCKET && ctx->optname == SO_SNDBUF) {
45 		/* Not interested in SOL_SOCKET:SO_SNDBUF;
46 		 * let next BPF program in the cgroup chain or kernel
47 		 * handle it.
48 		 */
49 		return 1;
50 	}
51 
52 	if (ctx->level == SOL_TCP && ctx->optname == TCP_CONGESTION) {
53 		/* Not interested in SOL_TCP:TCP_CONGESTION;
54 		 * let next BPF program in the cgroup chain or kernel
55 		 * handle it.
56 		 */
57 		return 1;
58 	}
59 
60 	if (ctx->level == SOL_IP && ctx->optname == IP_FREEBIND) {
61 		if (optval + 1 > optval_end)
62 			return 0; /* EPERM, bounds check */
63 
64 		ctx->retval = 0; /* Reset system call return value to zero */
65 
66 		/* Always export 0x55 */
67 		optval[0] = 0x55;
68 		ctx->optlen = 1;
69 
70 		/* Userspace buffer is PAGE_SIZE * 2, but BPF
71 		 * program can only see the first PAGE_SIZE
72 		 * bytes of data.
73 		 */
74 		if (optval_end - optval != PAGE_SIZE)
75 			return 0; /* EPERM, unexpected data size */
76 
77 		return 1;
78 	}
79 
80 	if (ctx->level != SOL_CUSTOM)
81 		return 0; /* EPERM, deny everything except custom level */
82 
83 	if (optval + 1 > optval_end)
84 		return 0; /* EPERM, bounds check */
85 
86 	storage = bpf_sk_storage_get(&socket_storage_map, ctx->sk, 0,
87 				     BPF_SK_STORAGE_GET_F_CREATE);
88 	if (!storage)
89 		return 0; /* EPERM, couldn't get sk storage */
90 
91 	if (!ctx->retval)
92 		return 0; /* EPERM, kernel should not have handled
93 			   * SOL_CUSTOM, something is wrong!
94 			   */
95 	ctx->retval = 0; /* Reset system call return value to zero */
96 
97 	optval[0] = storage->val;
98 	ctx->optlen = 1;
99 
100 	return 1;
101 }
102 
103 SEC("cgroup/setsockopt")
_setsockopt(struct bpf_sockopt * ctx)104 int _setsockopt(struct bpf_sockopt *ctx)
105 {
106 	__u8 *optval_end = ctx->optval_end;
107 	__u8 *optval = ctx->optval;
108 	struct sockopt_sk *storage;
109 
110 	if (ctx->level == SOL_IP && ctx->optname == IP_TOS) {
111 		/* Not interested in SOL_IP:IP_TOS;
112 		 * let next BPF program in the cgroup chain or kernel
113 		 * handle it.
114 		 */
115 		ctx->optlen = 0; /* bypass optval>PAGE_SIZE */
116 		return 1;
117 	}
118 
119 	if (ctx->level == SOL_SOCKET && ctx->optname == SO_SNDBUF) {
120 		/* Overwrite SO_SNDBUF value */
121 
122 		if (optval + sizeof(__u32) > optval_end)
123 			return 0; /* EPERM, bounds check */
124 
125 		*(__u32 *)optval = 0x55AA;
126 		ctx->optlen = 4;
127 
128 		return 1;
129 	}
130 
131 	if (ctx->level == SOL_TCP && ctx->optname == TCP_CONGESTION) {
132 		/* Always use cubic */
133 
134 		if (optval + 5 > optval_end)
135 			return 0; /* EPERM, bounds check */
136 
137 		memcpy(optval, "cubic", 5);
138 		ctx->optlen = 5;
139 
140 		return 1;
141 	}
142 
143 	if (ctx->level == SOL_IP && ctx->optname == IP_FREEBIND) {
144 		/* Original optlen is larger than PAGE_SIZE. */
145 		if (ctx->optlen != PAGE_SIZE * 2)
146 			return 0; /* EPERM, unexpected data size */
147 
148 		if (optval + 1 > optval_end)
149 			return 0; /* EPERM, bounds check */
150 
151 		/* Make sure we can trim the buffer. */
152 		optval[0] = 0;
153 		ctx->optlen = 1;
154 
155 		/* Usepace buffer is PAGE_SIZE * 2, but BPF
156 		 * program can only see the first PAGE_SIZE
157 		 * bytes of data.
158 		 */
159 		if (optval_end - optval != PAGE_SIZE)
160 			return 0; /* EPERM, unexpected data size */
161 
162 		return 1;
163 	}
164 
165 	if (ctx->level != SOL_CUSTOM)
166 		return 0; /* EPERM, deny everything except custom level */
167 
168 	if (optval + 1 > optval_end)
169 		return 0; /* EPERM, bounds check */
170 
171 	storage = bpf_sk_storage_get(&socket_storage_map, ctx->sk, 0,
172 				     BPF_SK_STORAGE_GET_F_CREATE);
173 	if (!storage)
174 		return 0; /* EPERM, couldn't get sk storage */
175 
176 	storage->val = optval[0];
177 	ctx->optlen = -1; /* BPF has consumed this option, don't call kernel
178 			   * setsockopt handler.
179 			   */
180 
181 	return 1;
182 }
183