bpf_iter.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /* Copyright (c) 2020 Facebook */
  3. #include <linux/fs.h>
  4. #include <linux/anon_inodes.h>
  5. #include <linux/filter.h>
  6. #include <linux/bpf.h>
  7. #include <linux/rcupdate_trace.h>
  8. struct bpf_iter_target_info {
  9. struct list_head list;
  10. const struct bpf_iter_reg *reg_info;
  11. u32 btf_id; /* cached value */
  12. };
  13. struct bpf_iter_link {
  14. struct bpf_link link;
  15. struct bpf_iter_aux_info aux;
  16. struct bpf_iter_target_info *tinfo;
  17. };
  18. struct bpf_iter_priv_data {
  19. struct bpf_iter_target_info *tinfo;
  20. const struct bpf_iter_seq_info *seq_info;
  21. struct bpf_prog *prog;
  22. u64 session_id;
  23. u64 seq_num;
  24. bool done_stop;
  25. u8 target_private[] __aligned(8);
  26. };
  27. static struct list_head targets = LIST_HEAD_INIT(targets);
  28. static DEFINE_MUTEX(targets_mutex);
  29. /* protect bpf_iter_link changes */
  30. static DEFINE_MUTEX(link_mutex);
  31. /* incremented on every opened seq_file */
  32. static atomic64_t session_id;
  33. static int prepare_seq_file(struct file *file, struct bpf_iter_link *link,
  34. const struct bpf_iter_seq_info *seq_info);
  35. static void bpf_iter_inc_seq_num(struct seq_file *seq)
  36. {
  37. struct bpf_iter_priv_data *iter_priv;
  38. iter_priv = container_of(seq->private, struct bpf_iter_priv_data,
  39. target_private);
  40. iter_priv->seq_num++;
  41. }
  42. static void bpf_iter_dec_seq_num(struct seq_file *seq)
  43. {
  44. struct bpf_iter_priv_data *iter_priv;
  45. iter_priv = container_of(seq->private, struct bpf_iter_priv_data,
  46. target_private);
  47. iter_priv->seq_num--;
  48. }
  49. static void bpf_iter_done_stop(struct seq_file *seq)
  50. {
  51. struct bpf_iter_priv_data *iter_priv;
  52. iter_priv = container_of(seq->private, struct bpf_iter_priv_data,
  53. target_private);
  54. iter_priv->done_stop = true;
  55. }
  56. static inline bool bpf_iter_target_support_resched(const struct bpf_iter_target_info *tinfo)
  57. {
  58. return tinfo->reg_info->feature & BPF_ITER_RESCHED;
  59. }
  60. static bool bpf_iter_support_resched(struct seq_file *seq)
  61. {
  62. struct bpf_iter_priv_data *iter_priv;
  63. iter_priv = container_of(seq->private, struct bpf_iter_priv_data,
  64. target_private);
  65. return bpf_iter_target_support_resched(iter_priv->tinfo);
  66. }
  67. /* maximum visited objects before bailing out */
  68. #define MAX_ITER_OBJECTS 1000000
  69. /* bpf_seq_read, a customized and simpler version for bpf iterator.
  70. * The following are differences from seq_read():
  71. * . fixed buffer size (PAGE_SIZE)
  72. * . assuming NULL ->llseek()
  73. * . stop() may call bpf program, handling potential overflow there
  74. */
  75. static ssize_t bpf_seq_read(struct file *file, char __user *buf, size_t size,
  76. loff_t *ppos)
  77. {
  78. struct seq_file *seq = file->private_data;
  79. size_t n, offs, copied = 0;
  80. int err = 0, num_objs = 0;
  81. bool can_resched;
  82. void *p;
  83. mutex_lock(&seq->lock);
  84. if (!seq->buf) {
  85. seq->size = PAGE_SIZE << 3;
  86. seq->buf = kvmalloc(seq->size, GFP_KERNEL);
  87. if (!seq->buf) {
  88. err = -ENOMEM;
  89. goto done;
  90. }
  91. }
  92. if (seq->count) {
  93. n = min(seq->count, size);
  94. err = copy_to_user(buf, seq->buf + seq->from, n);
  95. if (err) {
  96. err = -EFAULT;
  97. goto done;
  98. }
  99. seq->count -= n;
  100. seq->from += n;
  101. copied = n;
  102. goto done;
  103. }
  104. seq->from = 0;
  105. p = seq->op->start(seq, &seq->index);
  106. if (!p)
  107. goto stop;
  108. if (IS_ERR(p)) {
  109. err = PTR_ERR(p);
  110. seq->op->stop(seq, p);
  111. seq->count = 0;
  112. goto done;
  113. }
  114. err = seq->op->show(seq, p);
  115. if (err > 0) {
  116. /* object is skipped, decrease seq_num, so next
  117. * valid object can reuse the same seq_num.
  118. */
  119. bpf_iter_dec_seq_num(seq);
  120. seq->count = 0;
  121. } else if (err < 0 || seq_has_overflowed(seq)) {
  122. if (!err)
  123. err = -E2BIG;
  124. seq->op->stop(seq, p);
  125. seq->count = 0;
  126. goto done;
  127. }
  128. can_resched = bpf_iter_support_resched(seq);
  129. while (1) {
  130. loff_t pos = seq->index;
  131. num_objs++;
  132. offs = seq->count;
  133. p = seq->op->next(seq, p, &seq->index);
  134. if (pos == seq->index) {
  135. pr_info_ratelimited("buggy seq_file .next function %ps "
  136. "did not updated position index\n",
  137. seq->op->next);
  138. seq->index++;
  139. }
  140. if (IS_ERR_OR_NULL(p))
  141. break;
  142. /* got a valid next object, increase seq_num */
  143. bpf_iter_inc_seq_num(seq);
  144. if (seq->count >= size)
  145. break;
  146. if (num_objs >= MAX_ITER_OBJECTS) {
  147. if (offs == 0) {
  148. err = -EAGAIN;
  149. seq->op->stop(seq, p);
  150. goto done;
  151. }
  152. break;
  153. }
  154. err = seq->op->show(seq, p);
  155. if (err > 0) {
  156. bpf_iter_dec_seq_num(seq);
  157. seq->count = offs;
  158. } else if (err < 0 || seq_has_overflowed(seq)) {
  159. seq->count = offs;
  160. if (offs == 0) {
  161. if (!err)
  162. err = -E2BIG;
  163. seq->op->stop(seq, p);
  164. goto done;
  165. }
  166. break;
  167. }
  168. if (can_resched)
  169. cond_resched();
  170. }
  171. stop:
  172. offs = seq->count;
  173. if (IS_ERR(p)) {
  174. seq->op->stop(seq, NULL);
  175. err = PTR_ERR(p);
  176. goto done;
  177. }
  178. /* bpf program called if !p */
  179. seq->op->stop(seq, p);
  180. if (!p) {
  181. if (!seq_has_overflowed(seq)) {
  182. bpf_iter_done_stop(seq);
  183. } else {
  184. seq->count = offs;
  185. if (offs == 0) {
  186. err = -E2BIG;
  187. goto done;
  188. }
  189. }
  190. }
  191. n = min(seq->count, size);
  192. err = copy_to_user(buf, seq->buf, n);
  193. if (err) {
  194. err = -EFAULT;
  195. goto done;
  196. }
  197. copied = n;
  198. seq->count -= n;
  199. seq->from = n;
  200. done:
  201. if (!copied)
  202. copied = err;
  203. else
  204. *ppos += copied;
  205. mutex_unlock(&seq->lock);
  206. return copied;
  207. }
  208. static const struct bpf_iter_seq_info *
  209. __get_seq_info(struct bpf_iter_link *link)
  210. {
  211. const struct bpf_iter_seq_info *seq_info;
  212. if (link->aux.map) {
  213. seq_info = link->aux.map->ops->iter_seq_info;
  214. if (seq_info)
  215. return seq_info;
  216. }
  217. return link->tinfo->reg_info->seq_info;
  218. }
  219. static int iter_open(struct inode *inode, struct file *file)
  220. {
  221. struct bpf_iter_link *link = inode->i_private;
  222. return prepare_seq_file(file, link, __get_seq_info(link));
  223. }
  224. static int iter_release(struct inode *inode, struct file *file)
  225. {
  226. struct bpf_iter_priv_data *iter_priv;
  227. struct seq_file *seq;
  228. seq = file->private_data;
  229. if (!seq)
  230. return 0;
  231. iter_priv = container_of(seq->private, struct bpf_iter_priv_data,
  232. target_private);
  233. if (iter_priv->seq_info->fini_seq_private)
  234. iter_priv->seq_info->fini_seq_private(seq->private);
  235. bpf_prog_put(iter_priv->prog);
  236. seq->private = iter_priv;
  237. return seq_release_private(inode, file);
  238. }
  239. const struct file_operations bpf_iter_fops = {
  240. .open = iter_open,
  241. .llseek = no_llseek,
  242. .read = bpf_seq_read,
  243. .release = iter_release,
  244. };
  245. /* The argument reg_info will be cached in bpf_iter_target_info.
  246. * The common practice is to declare target reg_info as
  247. * a const static variable and passed as an argument to
  248. * bpf_iter_reg_target().
  249. */
  250. int bpf_iter_reg_target(const struct bpf_iter_reg *reg_info)
  251. {
  252. struct bpf_iter_target_info *tinfo;
  253. tinfo = kzalloc(sizeof(*tinfo), GFP_KERNEL);
  254. if (!tinfo)
  255. return -ENOMEM;
  256. tinfo->reg_info = reg_info;
  257. INIT_LIST_HEAD(&tinfo->list);
  258. mutex_lock(&targets_mutex);
  259. list_add(&tinfo->list, &targets);
  260. mutex_unlock(&targets_mutex);
  261. return 0;
  262. }
  263. void bpf_iter_unreg_target(const struct bpf_iter_reg *reg_info)
  264. {
  265. struct bpf_iter_target_info *tinfo;
  266. bool found = false;
  267. mutex_lock(&targets_mutex);
  268. list_for_each_entry(tinfo, &targets, list) {
  269. if (reg_info == tinfo->reg_info) {
  270. list_del(&tinfo->list);
  271. kfree(tinfo);
  272. found = true;
  273. break;
  274. }
  275. }
  276. mutex_unlock(&targets_mutex);
  277. WARN_ON(found == false);
  278. }
  279. static void cache_btf_id(struct bpf_iter_target_info *tinfo,
  280. struct bpf_prog *prog)
  281. {
  282. tinfo->btf_id = prog->aux->attach_btf_id;
  283. }
  284. bool bpf_iter_prog_supported(struct bpf_prog *prog)
  285. {
  286. const char *attach_fname = prog->aux->attach_func_name;
  287. struct bpf_iter_target_info *tinfo = NULL, *iter;
  288. u32 prog_btf_id = prog->aux->attach_btf_id;
  289. const char *prefix = BPF_ITER_FUNC_PREFIX;
  290. int prefix_len = strlen(prefix);
  291. if (strncmp(attach_fname, prefix, prefix_len))
  292. return false;
  293. mutex_lock(&targets_mutex);
  294. list_for_each_entry(iter, &targets, list) {
  295. if (iter->btf_id && iter->btf_id == prog_btf_id) {
  296. tinfo = iter;
  297. break;
  298. }
  299. if (!strcmp(attach_fname + prefix_len, iter->reg_info->target)) {
  300. cache_btf_id(iter, prog);
  301. tinfo = iter;
  302. break;
  303. }
  304. }
  305. mutex_unlock(&targets_mutex);
  306. if (tinfo) {
  307. prog->aux->ctx_arg_info_size = tinfo->reg_info->ctx_arg_info_size;
  308. prog->aux->ctx_arg_info = tinfo->reg_info->ctx_arg_info;
  309. }
  310. return tinfo != NULL;
  311. }
  312. const struct bpf_func_proto *
  313. bpf_iter_get_func_proto(enum bpf_func_id func_id, const struct bpf_prog *prog)
  314. {
  315. const struct bpf_iter_target_info *tinfo;
  316. const struct bpf_func_proto *fn = NULL;
  317. mutex_lock(&targets_mutex);
  318. list_for_each_entry(tinfo, &targets, list) {
  319. if (tinfo->btf_id == prog->aux->attach_btf_id) {
  320. const struct bpf_iter_reg *reg_info;
  321. reg_info = tinfo->reg_info;
  322. if (reg_info->get_func_proto)
  323. fn = reg_info->get_func_proto(func_id, prog);
  324. break;
  325. }
  326. }
  327. mutex_unlock(&targets_mutex);
  328. return fn;
  329. }
  330. static void bpf_iter_link_release(struct bpf_link *link)
  331. {
  332. struct bpf_iter_link *iter_link =
  333. container_of(link, struct bpf_iter_link, link);
  334. if (iter_link->tinfo->reg_info->detach_target)
  335. iter_link->tinfo->reg_info->detach_target(&iter_link->aux);
  336. }
  337. static void bpf_iter_link_dealloc(struct bpf_link *link)
  338. {
  339. struct bpf_iter_link *iter_link =
  340. container_of(link, struct bpf_iter_link, link);
  341. kfree(iter_link);
  342. }
  343. static int bpf_iter_link_replace(struct bpf_link *link,
  344. struct bpf_prog *new_prog,
  345. struct bpf_prog *old_prog)
  346. {
  347. int ret = 0;
  348. mutex_lock(&link_mutex);
  349. if (old_prog && link->prog != old_prog) {
  350. ret = -EPERM;
  351. goto out_unlock;
  352. }
  353. if (link->prog->type != new_prog->type ||
  354. link->prog->expected_attach_type != new_prog->expected_attach_type ||
  355. link->prog->aux->attach_btf_id != new_prog->aux->attach_btf_id) {
  356. ret = -EINVAL;
  357. goto out_unlock;
  358. }
  359. old_prog = xchg(&link->prog, new_prog);
  360. bpf_prog_put(old_prog);
  361. out_unlock:
  362. mutex_unlock(&link_mutex);
  363. return ret;
  364. }
  365. static void bpf_iter_link_show_fdinfo(const struct bpf_link *link,
  366. struct seq_file *seq)
  367. {
  368. struct bpf_iter_link *iter_link =
  369. container_of(link, struct bpf_iter_link, link);
  370. bpf_iter_show_fdinfo_t show_fdinfo;
  371. seq_printf(seq,
  372. "target_name:\t%s\n",
  373. iter_link->tinfo->reg_info->target);
  374. show_fdinfo = iter_link->tinfo->reg_info->show_fdinfo;
  375. if (show_fdinfo)
  376. show_fdinfo(&iter_link->aux, seq);
  377. }
  378. static int bpf_iter_link_fill_link_info(const struct bpf_link *link,
  379. struct bpf_link_info *info)
  380. {
  381. struct bpf_iter_link *iter_link =
  382. container_of(link, struct bpf_iter_link, link);
  383. char __user *ubuf = u64_to_user_ptr(info->iter.target_name);
  384. bpf_iter_fill_link_info_t fill_link_info;
  385. u32 ulen = info->iter.target_name_len;
  386. const char *target_name;
  387. u32 target_len;
  388. if (!ulen ^ !ubuf)
  389. return -EINVAL;
  390. target_name = iter_link->tinfo->reg_info->target;
  391. target_len = strlen(target_name);
  392. info->iter.target_name_len = target_len + 1;
  393. if (ubuf) {
  394. if (ulen >= target_len + 1) {
  395. if (copy_to_user(ubuf, target_name, target_len + 1))
  396. return -EFAULT;
  397. } else {
  398. char zero = '\0';
  399. if (copy_to_user(ubuf, target_name, ulen - 1))
  400. return -EFAULT;
  401. if (put_user(zero, ubuf + ulen - 1))
  402. return -EFAULT;
  403. return -ENOSPC;
  404. }
  405. }
  406. fill_link_info = iter_link->tinfo->reg_info->fill_link_info;
  407. if (fill_link_info)
  408. return fill_link_info(&iter_link->aux, info);
  409. return 0;
  410. }
  411. static const struct bpf_link_ops bpf_iter_link_lops = {
  412. .release = bpf_iter_link_release,
  413. .dealloc = bpf_iter_link_dealloc,
  414. .update_prog = bpf_iter_link_replace,
  415. .show_fdinfo = bpf_iter_link_show_fdinfo,
  416. .fill_link_info = bpf_iter_link_fill_link_info,
  417. };
  418. bool bpf_link_is_iter(struct bpf_link *link)
  419. {
  420. return link->ops == &bpf_iter_link_lops;
  421. }
  422. int bpf_iter_link_attach(const union bpf_attr *attr, bpfptr_t uattr,
  423. struct bpf_prog *prog)
  424. {
  425. struct bpf_iter_target_info *tinfo = NULL, *iter;
  426. struct bpf_link_primer link_primer;
  427. union bpf_iter_link_info linfo;
  428. struct bpf_iter_link *link;
  429. u32 prog_btf_id, linfo_len;
  430. bpfptr_t ulinfo;
  431. int err;
  432. if (attr->link_create.target_fd || attr->link_create.flags)
  433. return -EINVAL;
  434. memset(&linfo, 0, sizeof(union bpf_iter_link_info));
  435. ulinfo = make_bpfptr(attr->link_create.iter_info, uattr.is_kernel);
  436. linfo_len = attr->link_create.iter_info_len;
  437. if (bpfptr_is_null(ulinfo) ^ !linfo_len)
  438. return -EINVAL;
  439. if (!bpfptr_is_null(ulinfo)) {
  440. err = bpf_check_uarg_tail_zero(ulinfo, sizeof(linfo),
  441. linfo_len);
  442. if (err)
  443. return err;
  444. linfo_len = min_t(u32, linfo_len, sizeof(linfo));
  445. if (copy_from_bpfptr(&linfo, ulinfo, linfo_len))
  446. return -EFAULT;
  447. }
  448. prog_btf_id = prog->aux->attach_btf_id;
  449. mutex_lock(&targets_mutex);
  450. list_for_each_entry(iter, &targets, list) {
  451. if (iter->btf_id == prog_btf_id) {
  452. tinfo = iter;
  453. break;
  454. }
  455. }
  456. mutex_unlock(&targets_mutex);
  457. if (!tinfo)
  458. return -ENOENT;
  459. /* Only allow sleepable program for resched-able iterator */
  460. if (prog->aux->sleepable && !bpf_iter_target_support_resched(tinfo))
  461. return -EINVAL;
  462. link = kzalloc(sizeof(*link), GFP_USER | __GFP_NOWARN);
  463. if (!link)
  464. return -ENOMEM;
  465. bpf_link_init(&link->link, BPF_LINK_TYPE_ITER, &bpf_iter_link_lops, prog);
  466. link->tinfo = tinfo;
  467. err = bpf_link_prime(&link->link, &link_primer);
  468. if (err) {
  469. kfree(link);
  470. return err;
  471. }
  472. if (tinfo->reg_info->attach_target) {
  473. err = tinfo->reg_info->attach_target(prog, &linfo, &link->aux);
  474. if (err) {
  475. bpf_link_cleanup(&link_primer);
  476. return err;
  477. }
  478. }
  479. return bpf_link_settle(&link_primer);
  480. }
  481. static void init_seq_meta(struct bpf_iter_priv_data *priv_data,
  482. struct bpf_iter_target_info *tinfo,
  483. const struct bpf_iter_seq_info *seq_info,
  484. struct bpf_prog *prog)
  485. {
  486. priv_data->tinfo = tinfo;
  487. priv_data->seq_info = seq_info;
  488. priv_data->prog = prog;
  489. priv_data->session_id = atomic64_inc_return(&session_id);
  490. priv_data->seq_num = 0;
  491. priv_data->done_stop = false;
  492. }
  493. static int prepare_seq_file(struct file *file, struct bpf_iter_link *link,
  494. const struct bpf_iter_seq_info *seq_info)
  495. {
  496. struct bpf_iter_priv_data *priv_data;
  497. struct bpf_iter_target_info *tinfo;
  498. struct bpf_prog *prog;
  499. u32 total_priv_dsize;
  500. struct seq_file *seq;
  501. int err = 0;
  502. mutex_lock(&link_mutex);
  503. prog = link->link.prog;
  504. bpf_prog_inc(prog);
  505. mutex_unlock(&link_mutex);
  506. tinfo = link->tinfo;
  507. total_priv_dsize = offsetof(struct bpf_iter_priv_data, target_private) +
  508. seq_info->seq_priv_size;
  509. priv_data = __seq_open_private(file, seq_info->seq_ops,
  510. total_priv_dsize);
  511. if (!priv_data) {
  512. err = -ENOMEM;
  513. goto release_prog;
  514. }
  515. if (seq_info->init_seq_private) {
  516. err = seq_info->init_seq_private(priv_data->target_private, &link->aux);
  517. if (err)
  518. goto release_seq_file;
  519. }
  520. init_seq_meta(priv_data, tinfo, seq_info, prog);
  521. seq = file->private_data;
  522. seq->private = priv_data->target_private;
  523. return 0;
  524. release_seq_file:
  525. seq_release_private(file->f_inode, file);
  526. file->private_data = NULL;
  527. release_prog:
  528. bpf_prog_put(prog);
  529. return err;
  530. }
  531. int bpf_iter_new_fd(struct bpf_link *link)
  532. {
  533. struct bpf_iter_link *iter_link;
  534. struct file *file;
  535. unsigned int flags;
  536. int err, fd;
  537. if (link->ops != &bpf_iter_link_lops)
  538. return -EINVAL;
  539. flags = O_RDONLY | O_CLOEXEC;
  540. fd = get_unused_fd_flags(flags);
  541. if (fd < 0)
  542. return fd;
  543. file = anon_inode_getfile("bpf_iter", &bpf_iter_fops, NULL, flags);
  544. if (IS_ERR(file)) {
  545. err = PTR_ERR(file);
  546. goto free_fd;
  547. }
  548. iter_link = container_of(link, struct bpf_iter_link, link);
  549. err = prepare_seq_file(file, iter_link, __get_seq_info(iter_link));
  550. if (err)
  551. goto free_file;
  552. fd_install(fd, file);
  553. return fd;
  554. free_file:
  555. fput(file);
  556. free_fd:
  557. put_unused_fd(fd);
  558. return err;
  559. }
  560. struct bpf_prog *bpf_iter_get_info(struct bpf_iter_meta *meta, bool in_stop)
  561. {
  562. struct bpf_iter_priv_data *iter_priv;
  563. struct seq_file *seq;
  564. void *seq_priv;
  565. seq = meta->seq;
  566. if (seq->file->f_op != &bpf_iter_fops)
  567. return NULL;
  568. seq_priv = seq->private;
  569. iter_priv = container_of(seq_priv, struct bpf_iter_priv_data,
  570. target_private);
  571. if (in_stop && iter_priv->done_stop)
  572. return NULL;
  573. meta->session_id = iter_priv->session_id;
  574. meta->seq_num = iter_priv->seq_num;
  575. return iter_priv->prog;
  576. }
  577. int bpf_iter_run_prog(struct bpf_prog *prog, void *ctx)
  578. {
  579. struct bpf_run_ctx run_ctx, *old_run_ctx;
  580. int ret;
  581. if (prog->aux->sleepable) {
  582. rcu_read_lock_trace();
  583. migrate_disable();
  584. might_fault();
  585. old_run_ctx = bpf_set_run_ctx(&run_ctx);
  586. ret = bpf_prog_run(prog, ctx);
  587. bpf_reset_run_ctx(old_run_ctx);
  588. migrate_enable();
  589. rcu_read_unlock_trace();
  590. } else {
  591. rcu_read_lock();
  592. migrate_disable();
  593. old_run_ctx = bpf_set_run_ctx(&run_ctx);
  594. ret = bpf_prog_run(prog, ctx);
  595. bpf_reset_run_ctx(old_run_ctx);
  596. migrate_enable();
  597. rcu_read_unlock();
  598. }
  599. /* bpf program can only return 0 or 1:
  600. * 0 : okay
  601. * 1 : retry the same object
  602. * The bpf_iter_run_prog() return value
  603. * will be seq_ops->show() return value.
  604. */
  605. return ret == 0 ? 0 : -EAGAIN;
  606. }
  607. BPF_CALL_4(bpf_for_each_map_elem, struct bpf_map *, map, void *, callback_fn,
  608. void *, callback_ctx, u64, flags)
  609. {
  610. return map->ops->map_for_each_callback(map, callback_fn, callback_ctx, flags);
  611. }
  612. const struct bpf_func_proto bpf_for_each_map_elem_proto = {
  613. .func = bpf_for_each_map_elem,
  614. .gpl_only = false,
  615. .ret_type = RET_INTEGER,
  616. .arg1_type = ARG_CONST_MAP_PTR,
  617. .arg2_type = ARG_PTR_TO_FUNC,
  618. .arg3_type = ARG_PTR_TO_STACK_OR_NULL,
  619. .arg4_type = ARG_ANYTHING,
  620. };
  621. BPF_CALL_4(bpf_loop, u32, nr_loops, void *, callback_fn, void *, callback_ctx,
  622. u64, flags)
  623. {
  624. bpf_callback_t callback = (bpf_callback_t)callback_fn;
  625. u64 ret;
  626. u32 i;
  627. /* Note: these safety checks are also verified when bpf_loop
  628. * is inlined, be careful to modify this code in sync. See
  629. * function verifier.c:inline_bpf_loop.
  630. */
  631. if (flags)
  632. return -EINVAL;
  633. if (nr_loops > BPF_MAX_LOOPS)
  634. return -E2BIG;
  635. for (i = 0; i < nr_loops; i++) {
  636. ret = callback((u64)i, (u64)(long)callback_ctx, 0, 0, 0);
  637. /* return value: 0 - continue, 1 - stop and return */
  638. if (ret)
  639. return i + 1;
  640. }
  641. return i;
  642. }
  643. const struct bpf_func_proto bpf_loop_proto = {
  644. .func = bpf_loop,
  645. .gpl_only = false,
  646. .ret_type = RET_INTEGER,
  647. .arg1_type = ARG_ANYTHING,
  648. .arg2_type = ARG_PTR_TO_FUNC,
  649. .arg3_type = ARG_PTR_TO_STACK_OR_NULL,
  650. .arg4_type = ARG_ANYTHING,
  651. };