/* SPDX-License-Identifier: GPL-2.0-or-later */
/* memcontrol.h - Memory Controller
 *
 * Copyright IBM Corporation, 2007
 * Author Balbir Singh <[email protected]>
 *
 * Copyright 2007 OpenVZ SWsoft Inc
 * Author: Pavel Emelianov <[email protected]>
 */

#ifndef _LINUX_MEMCONTROL_H
#define _LINUX_MEMCONTROL_H

#include <linux/cgroup.h>
#include <linux/vm_event_item.h>
#include <linux/hardirq.h>
#include <linux/jump_label.h>
#include <linux/page_counter.h>
#include <linux/vmpressure.h>
#include <linux/eventfd.h>
#include <linux/mm.h>
#include <linux/vmstat.h>
#include <linux/writeback.h>
#include <linux/page-flags.h>

struct mem_cgroup;
struct obj_cgroup;
struct page;
struct mm_struct;
struct kmem_cache;

/* Cgroup-specific page state, on top of universal node page state */
enum memcg_stat_item {
	MEMCG_SWAP = NR_VM_NODE_STAT_ITEMS,
	MEMCG_SOCK,
	MEMCG_PERCPU_B,
	MEMCG_VMALLOC,
	MEMCG_KMEM,
	MEMCG_ZSWAP_B,
	MEMCG_ZSWAPPED,
	MEMCG_NR_STAT,
};

enum memcg_memory_event {
	MEMCG_LOW,
	MEMCG_HIGH,
	MEMCG_MAX,
	MEMCG_OOM,
	MEMCG_OOM_KILL,
	MEMCG_OOM_GROUP_KILL,
	MEMCG_SWAP_HIGH,
	MEMCG_SWAP_MAX,
	MEMCG_SWAP_FAIL,
	MEMCG_NR_MEMORY_EVENTS,
};

struct mem_cgroup_reclaim_cookie {
	pg_data_t *pgdat;
	unsigned int generation;
};

#ifdef CONFIG_MEMCG

#define MEM_CGROUP_ID_SHIFT	16
#define MEM_CGROUP_ID_MAX	USHRT_MAX

struct mem_cgroup_id {
	int id;
	refcount_t ref;
};

/*
 * The per-memcg event counter is incremented on every pagein/pageout. With
 * THP, it is incremented by the number of pages. The counter is used to
 * trigger some periodic events. This is straightforward and better than
 * using jiffies etc. to handle periodic memcg events.
 */
enum mem_cgroup_events_target {
	MEM_CGROUP_TARGET_THRESH,
	MEM_CGROUP_TARGET_SOFTLIMIT,
	MEM_CGROUP_NTARGETS,
};

struct memcg_vmstats_percpu;
struct memcg_vmstats;

struct mem_cgroup_reclaim_iter {
	struct mem_cgroup *position;
	/* scan generation, increased every round-trip */
	unsigned int generation;
};

/*
 * Bitmap and deferred work of shrinker::id corresponding to memcg-aware
 * shrinkers, which have elements charged to this memcg.
 */
struct shrinker_info {
	struct rcu_head rcu;
	atomic_long_t *nr_deferred;
	unsigned long *map;
};

struct lruvec_stats_percpu {
	/* Local (CPU and cgroup) state */
	long state[NR_VM_NODE_STAT_ITEMS];

	/* Delta calculation for lockless upward propagation */
	long state_prev[NR_VM_NODE_STAT_ITEMS];
};

struct lruvec_stats {
	/* Aggregated (CPU and subtree) state */
	long state[NR_VM_NODE_STAT_ITEMS];

	/* Pending child counts during tree propagation */
	long state_pending[NR_VM_NODE_STAT_ITEMS];
};

/*
 * per-node information in memory controller.
 */
struct mem_cgroup_per_node {
	struct lruvec lruvec;

	struct lruvec_stats_percpu __percpu *lruvec_stats_percpu;
	struct lruvec_stats lruvec_stats;

	unsigned long lru_zone_size[MAX_NR_ZONES][NR_LRU_LISTS];

	struct mem_cgroup_reclaim_iter iter;

	struct shrinker_info __rcu *shrinker_info;

	struct rb_node tree_node;	/* RB tree node */
	unsigned long usage_in_excess;	/* Set to the value by which */
					/* the soft limit is exceeded */
	bool on_tree;
	struct mem_cgroup *memcg;	/* Back pointer, we cannot */
					/* use container_of */
};

struct mem_cgroup_threshold {
	struct eventfd_ctx *eventfd;
	unsigned long threshold;
};

/* For threshold */
struct mem_cgroup_threshold_ary {
	/* An array index points to threshold just below or equal to usage. */
	int current_threshold;
	/* Size of entries[] */
	unsigned int size;
	/* Array of thresholds */
	struct mem_cgroup_threshold entries[];
};

struct mem_cgroup_thresholds {
	/* Primary thresholds array */
	struct mem_cgroup_threshold_ary *primary;
	/*
	 * Spare threshold array.
	 * This is needed to make mem_cgroup_unregister_event() "never fail".
	 * It must be able to store at least primary->size - 1 entries.
	 */
	struct mem_cgroup_threshold_ary *spare;
};

/*
 * Remember four most recent foreign writebacks with dirty pages in this
 * cgroup. Inode sharing is expected to be uncommon and, even if we miss
 * one in a given round, we're likely to catch it later if it keeps
 * foreign-dirtying, so a fairly low count should be enough.
 *
 * See mem_cgroup_track_foreign_dirty_slowpath() for details.
 */
#define MEMCG_CGWB_FRN_CNT	4

struct memcg_cgwb_frn {
	u64 bdi_id;			/* bdi->id of the foreign inode */
	int memcg_id;			/* memcg->css.id of foreign inode */
	u64 at;				/* jiffies_64 at the time of dirtying */
	struct wb_completion done;	/* tracks in-flight foreign writebacks */
};

/*
 * Bucket for arbitrarily byte-sized objects charged to a memory
 * cgroup. The bucket can be reparented in one piece when the cgroup
 * is destroyed, without having to round up the individual references
 * of all live memory objects in the wild.
 */
struct obj_cgroup {
	struct percpu_ref refcnt;
	struct mem_cgroup *memcg;
	atomic_t nr_charged_bytes;
	union {
		struct list_head list; /* protected by objcg_lock */
		struct rcu_head rcu;
	};
};

/*
 * The memory controller data structure. The memory controller controls both
 * page cache and RSS per cgroup. We would eventually like to provide
 * statistics based on the statistics developed by Rik Van Riel for clock-pro,
 * to help the administrator determine what knobs to tune.
 */
struct mem_cgroup {
	struct cgroup_subsys_state css;

	/* Private memcg ID. Used to ID objects that outlive the cgroup */
	struct mem_cgroup_id id;

	/* Accounted resources */
	struct page_counter memory;		/* Both v1 & v2 */

	union {
		struct page_counter swap;	/* v2 only */
		struct page_counter memsw;	/* v1 only */
	};

	/* Legacy consumer-oriented counters */
	struct page_counter kmem;		/* v1 only */
	struct page_counter tcpmem;		/* v1 only */

	/* Range enforcement for interrupt charges */
	struct work_struct high_work;

#if defined(CONFIG_MEMCG_KMEM) && defined(CONFIG_ZSWAP)
	unsigned long zswap_max;
#endif

	unsigned long soft_limit;

	/* vmpressure notifications */
	struct vmpressure vmpressure;

	/*
	 * Should the OOM killer kill all tasks belonging to this cgroup,
	 * if it has to kill one of them?
	 */
	bool oom_group;

	/* protected by memcg_oom_lock */
	bool oom_lock;
	int under_oom;

	int swappiness;
	/* OOM-Killer disable */
	int oom_kill_disable;

	/* memory.events and memory.events.local */
	struct cgroup_file events_file;
	struct cgroup_file events_local_file;

	/* handle for "memory.swap.events" */
	struct cgroup_file swap_events_file;

	/* protect arrays of thresholds */
	struct mutex thresholds_lock;

	/* thresholds for memory usage. RCU-protected */
	struct mem_cgroup_thresholds thresholds;

	/* thresholds for mem+swap usage. RCU-protected */
	struct mem_cgroup_thresholds memsw_thresholds;

	/* For oom notifier event fd */
	struct list_head oom_notify;

	/*
	 * Should we move charges of a task when a task is moved into this
	 * mem_cgroup ? And what type of charges should we move ?
	 */
	unsigned long move_charge_at_immigrate;
	/* taken only while moving_account > 0 */
	spinlock_t move_lock;
	unsigned long move_lock_flags;

	CACHELINE_PADDING(_pad1_);

	/* memory.stat */
	struct memcg_vmstats *vmstats;

	/* memory.events */
	atomic_long_t memory_events[MEMCG_NR_MEMORY_EVENTS];
	atomic_long_t memory_events_local[MEMCG_NR_MEMORY_EVENTS];

	/*
	 * Hint of reclaim pressure for socket memory management. Note
	 * that this indicator should NOT be used in legacy cgroup mode
	 * where socket memory is accounted/charged separately.
	 */
	unsigned long socket_pressure;

	/* Legacy tcp memory accounting */
	bool tcpmem_active;
	int tcpmem_pressure;

#ifdef CONFIG_MEMCG_KMEM
	int kmemcg_id;
	struct obj_cgroup __rcu *objcg;
	/* list of inherited objcgs, protected by objcg_lock */
	struct list_head objcg_list;
#endif

	CACHELINE_PADDING(_pad2_);

	/*
	 * set > 0 if pages under this cgroup are moving to another cgroup.
	 */
	atomic_t moving_account;
	struct task_struct *move_lock_task;

	struct memcg_vmstats_percpu __percpu *vmstats_percpu;

#ifdef CONFIG_CGROUP_WRITEBACK
	struct list_head cgwb_list;
	struct wb_domain cgwb_domain;
	struct memcg_cgwb_frn cgwb_frn[MEMCG_CGWB_FRN_CNT];
#endif

	/* List of events which userspace wants to receive */
	struct list_head event_list;
	spinlock_t event_list_lock;

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
	struct deferred_split deferred_split_queue;
#endif

#ifdef CONFIG_LRU_GEN
	/* per-memcg mm_struct list */
	struct lru_gen_mm_list mm_list;
#endif

	ANDROID_OEM_DATA_ARRAY(1, 2);

	struct mem_cgroup_per_node *nodeinfo[];
};

/*
 * size of first charge trial.
 * TODO: it may be necessary to use a larger batch on large machines, or to
 * size it dynamically based on the workload.
 */
#define MEMCG_CHARGE_BATCH 64U

extern struct mem_cgroup *root_mem_cgroup;

enum page_memcg_data_flags {
	/* page->memcg_data is a pointer to an objcgs vector */
	MEMCG_DATA_OBJCGS = (1UL << 0),
	/* page has been accounted as a non-slab kernel page */
	MEMCG_DATA_KMEM = (1UL << 1),
	/* the next bit after the last actual flag */
	__NR_MEMCG_DATA_FLAGS = (1UL << 2),
};

#define MEMCG_DATA_FLAGS_MASK (__NR_MEMCG_DATA_FLAGS - 1)

static inline bool folio_memcg_kmem(struct folio *folio);

/*
 * After the initialization objcg->memcg is always pointing at
 * a valid memcg, but can be atomically swapped to the parent memcg.
 *
 * The caller must ensure that the returned memcg won't be released:
 * e.g. acquire the rcu_read_lock or css_set_lock.
 */
static inline struct mem_cgroup *obj_cgroup_memcg(struct obj_cgroup *objcg)
{
	return READ_ONCE(objcg->memcg);
}
/*
 * __folio_memcg - Get the memory cgroup associated with a non-kmem folio
 * @folio: Pointer to the folio.
 *
 * Returns a pointer to the memory cgroup associated with the folio,
 * or NULL. This function assumes that the folio is known to have a
 * proper memory cgroup pointer. It's not safe to call this function
 * against some types of folios, e.g. slab folios, ex-slab folios or
 * kmem folios.
 */
static inline struct mem_cgroup *__folio_memcg(struct folio *folio)
{
	unsigned long memcg_data = folio->memcg_data;

	VM_BUG_ON_FOLIO(folio_test_slab(folio), folio);
	VM_BUG_ON_FOLIO(memcg_data & MEMCG_DATA_OBJCGS, folio);
	VM_BUG_ON_FOLIO(memcg_data & MEMCG_DATA_KMEM, folio);

	return (struct mem_cgroup *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
}

/*
 * __folio_objcg - get the object cgroup associated with a kmem folio.
 * @folio: Pointer to the folio.
 *
 * Returns a pointer to the object cgroup associated with the folio,
 * or NULL. This function assumes that the folio is known to have a
 * proper object cgroup pointer. It's not safe to call this function
 * against some types of folios, e.g. slab folios, ex-slab folios or
 * LRU folios.
 */
static inline struct obj_cgroup *__folio_objcg(struct folio *folio)
{
	unsigned long memcg_data = folio->memcg_data;

	VM_BUG_ON_FOLIO(folio_test_slab(folio), folio);
	VM_BUG_ON_FOLIO(memcg_data & MEMCG_DATA_OBJCGS, folio);
	VM_BUG_ON_FOLIO(!(memcg_data & MEMCG_DATA_KMEM), folio);

	return (struct obj_cgroup *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
}

/*
 * folio_memcg - Get the memory cgroup associated with a folio.
 * @folio: Pointer to the folio.
 *
 * Returns a pointer to the memory cgroup associated with the folio,
 * or NULL. This function assumes that the folio is known to have a
 * proper memory cgroup pointer. It's not safe to call this function
 * against some types of folios, e.g. slab folios or ex-slab folios.
 *
 * For a non-kmem folio any of the following ensures folio and memcg binding
 * stability:
 *
 * - the folio lock
 * - LRU isolation
 * - lock_page_memcg()
 * - exclusive reference
 * - mem_cgroup_trylock_pages()
 *
 * For a kmem folio a caller should hold an rcu read lock to protect the memcg
 * associated with a kmem folio from being released.
 */
static inline struct mem_cgroup *folio_memcg(struct folio *folio)
{
	if (folio_memcg_kmem(folio))
		return obj_cgroup_memcg(__folio_objcg(folio));
	return __folio_memcg(folio);
}

static inline struct mem_cgroup *page_memcg(struct page *page)
{
	return folio_memcg(page_folio(page));
}

/**
 * folio_memcg_rcu - Locklessly get the memory cgroup associated with a folio.
 * @folio: Pointer to the folio.
 *
 * This function assumes that the folio is known to have a
 * proper memory cgroup pointer. It's not safe to call this function
 * against some types of folios, e.g. slab folios or ex-slab folios.
 *
 * Return: A pointer to the memory cgroup associated with the folio,
 * or NULL.
 */
static inline struct mem_cgroup *folio_memcg_rcu(struct folio *folio)
{
	unsigned long memcg_data = READ_ONCE(folio->memcg_data);

	VM_BUG_ON_FOLIO(folio_test_slab(folio), folio);
	WARN_ON_ONCE(!rcu_read_lock_held());

	if (memcg_data & MEMCG_DATA_KMEM) {
		struct obj_cgroup *objcg;

		objcg = (void *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
		return obj_cgroup_memcg(objcg);
	}

	return (struct mem_cgroup *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
}
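
/*
 * Illustrative only (not part of the API defined here): a minimal sketch of
 * the locking rule documented above. folio_memcg_rcu() may only be called
 * under rcu_read_lock(), and the returned memcg is only stable for the
 * duration of the RCU read-side critical section; pin it with css_tryget()
 * if it must be used afterwards. inspect_folio_memcg() is a hypothetical
 * helper name.
 *
 *	static void inspect_folio_memcg(struct folio *folio)
 *	{
 *		struct mem_cgroup *memcg;
 *
 *		rcu_read_lock();
 *		memcg = folio_memcg_rcu(folio);
 *		if (memcg)
 *			pr_debug("folio charged to memcg id %u\n",
 *				 mem_cgroup_id(memcg));
 *		rcu_read_unlock();
 *	}
 */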
/*
 * page_memcg_check - get the memory cgroup associated with a page
 * @page: a pointer to the page struct
 *
 * Returns a pointer to the memory cgroup associated with the page,
 * or NULL. This function, unlike page_memcg(), can take any page
 * as an argument. It has to be used in cases when it's not known if a page
 * has an associated memory cgroup pointer, an object cgroups vector or
 * an object cgroup.
 *
 * For a non-kmem page any of the following ensures page and memcg binding
 * stability:
 *
 * - the page lock
 * - LRU isolation
 * - lock_page_memcg()
 * - exclusive reference
 * - mem_cgroup_trylock_pages()
 *
 * For a kmem page a caller should hold an rcu read lock to protect the memcg
 * associated with a kmem page from being released.
 */
static inline struct mem_cgroup *page_memcg_check(struct page *page)
{
	/*
	 * Because page->memcg_data might be changed asynchronously
	 * for slab pages, READ_ONCE() should be used here.
	 */
	unsigned long memcg_data = READ_ONCE(page->memcg_data);

	if (memcg_data & MEMCG_DATA_OBJCGS)
		return NULL;

	if (memcg_data & MEMCG_DATA_KMEM) {
		struct obj_cgroup *objcg;

		objcg = (void *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
		return obj_cgroup_memcg(objcg);
	}

	return (struct mem_cgroup *)(memcg_data & ~MEMCG_DATA_FLAGS_MASK);
}

static inline struct mem_cgroup *get_mem_cgroup_from_objcg(struct obj_cgroup *objcg)
{
	struct mem_cgroup *memcg;

	rcu_read_lock();
retry:
	memcg = obj_cgroup_memcg(objcg);
	if (unlikely(!css_tryget(&memcg->css)))
		goto retry;
	rcu_read_unlock();

	return memcg;
}

#ifdef CONFIG_MEMCG_KMEM
/*
 * folio_memcg_kmem - Check if the folio has the memcg_kmem flag set.
 * @folio: Pointer to the folio.
 *
 * Checks if the folio has the MemcgKmem flag set. The caller must ensure
 * that the folio has an associated memory cgroup. It's not safe to call
 * this function against some types of folios, e.g. slab folios.
 */
static inline bool folio_memcg_kmem(struct folio *folio)
{
	VM_BUG_ON_PGFLAGS(PageTail(&folio->page), &folio->page);
	VM_BUG_ON_FOLIO(folio->memcg_data & MEMCG_DATA_OBJCGS, folio);
	return folio->memcg_data & MEMCG_DATA_KMEM;
}

#else
static inline bool folio_memcg_kmem(struct folio *folio)
{
	return false;
}
#endif

static inline bool PageMemcgKmem(struct page *page)
{
	return folio_memcg_kmem(page_folio(page));
}

static inline bool mem_cgroup_is_root(struct mem_cgroup *memcg)
{
	return (memcg == root_mem_cgroup);
}

static inline bool mem_cgroup_disabled(void)
{
	return !cgroup_subsys_enabled(memory_cgrp_subsys);
}

static inline void mem_cgroup_protection(struct mem_cgroup *root,
					 struct mem_cgroup *memcg,
					 unsigned long *min,
					 unsigned long *low)
{
	*min = *low = 0;

	if (mem_cgroup_disabled())
		return;

	/*
	 * There is no reclaim protection applied to a targeted reclaim.
	 * We are special casing this specific case here because
	 * mem_cgroup_protected calculation is not robust enough to keep
	 * the protection invariant for calculated effective values for
	 * parallel reclaimers with different reclaim targets. This is
	 * especially a problem for tail memcgs (as they have pages on LRU)
	 * which would want to have effective values 0 for targeted reclaim
	 * but a different value for external reclaim.
	 *
	 * Example
	 * Let's have global and A's reclaim in parallel:
	 *  |
	 *  A (low=2G, usage = 3G, max = 3G, children_low_usage = 1.5G)
	 *  |\
	 *  | C (low = 1G, usage = 2.5G)
	 *  B (low = 1G, usage = 0.5G)
	 *
	 * For the global reclaim
	 * A.elow = A.low
	 * B.elow = min(B.usage, B.low) because children_low_usage <= A.elow
	 * C.elow = min(C.usage, C.low)
	 *
	 * With the effective values resetting we have A reclaim
	 * A.elow = 0
	 * B.elow = B.low
	 * C.elow = C.low
	 *
	 * If the global reclaim races with A's reclaim then
	 * B.elow = C.elow = 0 because children_low_usage > A.elow
	 * is possible and reclaiming B would be violating the protection.
	 */
	if (root == memcg)
		return;

	*min = READ_ONCE(memcg->memory.emin);
	*low = READ_ONCE(memcg->memory.elow);
}

void mem_cgroup_calculate_protection(struct mem_cgroup *root,
				     struct mem_cgroup *memcg);

static inline bool mem_cgroup_supports_protection(struct mem_cgroup *memcg)
{
	/*
	 * The root memcg doesn't account charges, and doesn't support
	 * protection.
	 */
	return !mem_cgroup_disabled() && !mem_cgroup_is_root(memcg);
}

static inline bool mem_cgroup_below_low(struct mem_cgroup *memcg)
{
	if (!mem_cgroup_supports_protection(memcg))
		return false;

	return READ_ONCE(memcg->memory.elow) >=
		page_counter_read(&memcg->memory);
}

static inline bool mem_cgroup_below_min(struct mem_cgroup *memcg)
{
	if (!mem_cgroup_supports_protection(memcg))
		return false;

	return READ_ONCE(memcg->memory.emin) >=
		page_counter_read(&memcg->memory);
}
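
/*
 * Illustrative only: a sketch of how a reclaimer is expected to consult the
 * protection helpers above for each memcg it considers, relative to the
 * reclaim root. should_reclaim_from() is a hypothetical helper, not part of
 * this header; real reclaim additionally retries low-protected groups when
 * nothing else can be freed.
 *
 *	static bool should_reclaim_from(struct mem_cgroup *root,
 *					struct mem_cgroup *memcg)
 *	{
 *		mem_cgroup_calculate_protection(root, memcg);
 *
 *		if (mem_cgroup_below_min(memcg))
 *			return false;	// within memory.min, hard protected
 *		if (mem_cgroup_below_low(memcg))
 *			return false;	// within memory.low, deprioritize
 *		return true;
 *	}
 */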
int __mem_cgroup_charge(struct folio *folio, struct mm_struct *mm, gfp_t gfp);

/**
 * mem_cgroup_charge - Charge a newly allocated folio to a cgroup.
 * @folio: Folio to charge.
 * @mm: mm context of the allocating task.
 * @gfp: Reclaim mode.
 *
 * Try to charge @folio to the memcg that @mm belongs to, reclaiming
 * pages according to @gfp if necessary. If @mm is NULL, try to
 * charge to the active memcg.
 *
 * Do not use this for folios allocated for swapin.
 *
 * Return: 0 on success. Otherwise, an error code is returned.
 */
static inline int mem_cgroup_charge(struct folio *folio, struct mm_struct *mm,
				    gfp_t gfp)
{
	if (mem_cgroup_disabled())
		return 0;
	return __mem_cgroup_charge(folio, mm, gfp);
}

int mem_cgroup_swapin_charge_folio(struct folio *folio, struct mm_struct *mm,
				   gfp_t gfp, swp_entry_t entry);
void mem_cgroup_swapin_uncharge_swap(swp_entry_t entry);

void __mem_cgroup_uncharge(struct folio *folio);

/**
 * mem_cgroup_uncharge - Uncharge a folio.
 * @folio: Folio to uncharge.
 *
 * Uncharge a folio previously charged with mem_cgroup_charge().
 */
static inline void mem_cgroup_uncharge(struct folio *folio)
{
	if (mem_cgroup_disabled())
		return;
	__mem_cgroup_uncharge(folio);
}
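
/*
 * Illustrative only: a minimal sketch of the charge/uncharge pairing
 * described above, for a caller allocating a folio on behalf of a task's mm.
 * alloc_and_charge_folio() is a hypothetical helper, not part of this header;
 * in practice the uncharge is usually performed by the folio freeing path.
 *
 *	static struct folio *alloc_and_charge_folio(struct mm_struct *mm,
 *						    gfp_t gfp)
 *	{
 *		struct folio *folio = folio_alloc(gfp, 0);
 *
 *		if (!folio)
 *			return NULL;
 *		if (mem_cgroup_charge(folio, mm, gfp)) {
 *			folio_put(folio);	// charge failed, drop the folio
 *			return NULL;
 *		}
 *		return folio;
 *	}
 */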
void __mem_cgroup_uncharge_list(struct list_head *page_list);
static inline void mem_cgroup_uncharge_list(struct list_head *page_list)
{
	if (mem_cgroup_disabled())
		return;
	__mem_cgroup_uncharge_list(page_list);
}

void mem_cgroup_migrate(struct folio *old, struct folio *new);

/**
 * mem_cgroup_lruvec - get the lru list vector for a memcg & node
 * @memcg: memcg of the wanted lruvec
 * @pgdat: pglist_data
 *
 * Returns the lru list vector holding pages for a given @memcg &
 * @pgdat combination. This can be the node lruvec, if the memory
 * controller is disabled.
 */
static inline struct lruvec *mem_cgroup_lruvec(struct mem_cgroup *memcg,
					       struct pglist_data *pgdat)
{
	struct mem_cgroup_per_node *mz;
	struct lruvec *lruvec;

	if (mem_cgroup_disabled()) {
		lruvec = &pgdat->__lruvec;
		goto out;
	}

	if (!memcg)
		memcg = root_mem_cgroup;

	mz = memcg->nodeinfo[pgdat->node_id];
	lruvec = &mz->lruvec;
out:
	/*
	 * Since a node can be onlined after the mem_cgroup was created,
	 * we have to be prepared to initialize lruvec->pgdat here;
	 * and if offlined then reonlined, we need to reinitialize it.
	 */
	if (unlikely(lruvec->pgdat != pgdat))
		lruvec->pgdat = pgdat;
	return lruvec;
}

/**
 * folio_lruvec - return lruvec for isolating/putting an LRU folio
 * @folio: Pointer to the folio.
 *
 * This function relies on folio->mem_cgroup being stable.
 */
static inline struct lruvec *folio_lruvec(struct folio *folio)
{
	struct mem_cgroup *memcg = folio_memcg(folio);

	VM_WARN_ON_ONCE_FOLIO(!memcg && !mem_cgroup_disabled(), folio);
	return mem_cgroup_lruvec(memcg, folio_pgdat(folio));
}

struct mem_cgroup *mem_cgroup_from_task(struct task_struct *p);

struct mem_cgroup *get_mem_cgroup_from_mm(struct mm_struct *mm);

struct lruvec *folio_lruvec_lock(struct folio *folio);
struct lruvec *folio_lruvec_lock_irq(struct folio *folio);
struct lruvec *folio_lruvec_lock_irqsave(struct folio *folio,
					 unsigned long *flags);

#ifdef CONFIG_DEBUG_VM
void lruvec_memcg_debug(struct lruvec *lruvec, struct folio *folio);
#else
static inline
void lruvec_memcg_debug(struct lruvec *lruvec, struct folio *folio)
{
}
#endif

static inline
struct mem_cgroup *mem_cgroup_from_css(struct cgroup_subsys_state *css)
{
	return css ? container_of(css, struct mem_cgroup, css) : NULL;
}

static inline bool obj_cgroup_tryget(struct obj_cgroup *objcg)
{
	return percpu_ref_tryget(&objcg->refcnt);
}

static inline void obj_cgroup_get(struct obj_cgroup *objcg)
{
	percpu_ref_get(&objcg->refcnt);
}

static inline void obj_cgroup_get_many(struct obj_cgroup *objcg,
				       unsigned long nr)
{
	percpu_ref_get_many(&objcg->refcnt, nr);
}

static inline void obj_cgroup_put(struct obj_cgroup *objcg)
{
	percpu_ref_put(&objcg->refcnt);
}
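
/*
 * Illustrative only: the obj_cgroup reference helpers above follow the usual
 * tryget/get/put pattern. A sketch of pinning an objcg across a sleepable
 * section (stash_objcg() is a hypothetical caller, not part of this header):
 *
 *	static struct obj_cgroup *stash_objcg(struct obj_cgroup *objcg)
 *	{
 *		if (!objcg || !obj_cgroup_tryget(objcg))
 *			return NULL;	// cgroup is already being torn down
 *		return objcg;		// caller must obj_cgroup_put() later
 *	}
 */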
static inline bool mem_cgroup_tryget(struct mem_cgroup *memcg)
{
	return !memcg || css_tryget(&memcg->css);
}

static inline void mem_cgroup_put(struct mem_cgroup *memcg)
{
	if (memcg)
		css_put(&memcg->css);
}

#define mem_cgroup_from_counter(counter, member)	\
	container_of(counter, struct mem_cgroup, member)

struct mem_cgroup *mem_cgroup_iter(struct mem_cgroup *,
				   struct mem_cgroup *,
				   struct mem_cgroup_reclaim_cookie *);
void mem_cgroup_iter_break(struct mem_cgroup *, struct mem_cgroup *);
int mem_cgroup_scan_tasks(struct mem_cgroup *,
			  int (*)(struct task_struct *, void *), void *);
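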
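
/*
 * Illustrative only: the usual mem_cgroup_iter() walk over a subtree rooted
 * at an assumed "root" memcg (NULL means the full hierarchy). The iterator
 * takes and drops css references internally; call mem_cgroup_iter_break()
 * when leaving the loop early so the last reference is released.
 * visit_memcg() is a hypothetical callback.
 *
 *	struct mem_cgroup *memcg;
 *
 *	for (memcg = mem_cgroup_iter(root, NULL, NULL); memcg;
 *	     memcg = mem_cgroup_iter(root, memcg, NULL)) {
 *		if (visit_memcg(memcg)) {
 *			mem_cgroup_iter_break(root, memcg);
 *			break;
 *		}
 *	}
 */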
static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
{
	if (mem_cgroup_disabled())
		return 0;

	return memcg->id.id;
}
struct mem_cgroup *mem_cgroup_from_id(unsigned short id);

#ifdef CONFIG_SHRINKER_DEBUG
static inline unsigned long mem_cgroup_ino(struct mem_cgroup *memcg)
{
	return memcg ? cgroup_ino(memcg->css.cgroup) : 0;
}

struct mem_cgroup *mem_cgroup_get_from_ino(unsigned long ino);
#endif

static inline struct mem_cgroup *mem_cgroup_from_seq(struct seq_file *m)
{
	return mem_cgroup_from_css(seq_css(m));
}

static inline struct mem_cgroup *lruvec_memcg(struct lruvec *lruvec)
{
	struct mem_cgroup_per_node *mz;

	if (mem_cgroup_disabled())
		return NULL;

	mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	return mz->memcg;
}

/**
 * parent_mem_cgroup - find the accounting parent of a memcg
 * @memcg: memcg whose parent to find
 *
 * Returns the parent memcg, or NULL if this is the root or the memory
 * controller is in legacy no-hierarchy mode.
 */
static inline struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg)
{
	return mem_cgroup_from_css(memcg->css.parent);
}

static inline bool mem_cgroup_is_descendant(struct mem_cgroup *memcg,
					    struct mem_cgroup *root)
{
	if (root == memcg)
		return true;
	return cgroup_is_descendant(memcg->css.cgroup, root->css.cgroup);
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
				   struct mem_cgroup *memcg)
{
	struct mem_cgroup *task_memcg;
	bool match = false;

	rcu_read_lock();
	task_memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	if (task_memcg)
		match = mem_cgroup_is_descendant(task_memcg, memcg);
	rcu_read_unlock();
	return match;
}

struct cgroup_subsys_state *mem_cgroup_css_from_page(struct page *page);
ino_t page_cgroup_ino(struct page *page);

static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
{
	if (mem_cgroup_disabled())
		return true;
	return !!(memcg->css.flags & CSS_ONLINE);
}

void mem_cgroup_update_lru_size(struct lruvec *lruvec, enum lru_list lru,
				int zid, int nr_pages);

static inline
unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
					   enum lru_list lru, int zone_idx)
{
	struct mem_cgroup_per_node *mz;

	mz = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	return READ_ONCE(mz->lru_zone_size[zone_idx][lru]);
}

void mem_cgroup_handle_over_high(gfp_t gfp_mask);

unsigned long mem_cgroup_get_max(struct mem_cgroup *memcg);

unsigned long mem_cgroup_size(struct mem_cgroup *memcg);

void mem_cgroup_print_oom_context(struct mem_cgroup *memcg,
				  struct task_struct *p);

void mem_cgroup_print_oom_meminfo(struct mem_cgroup *memcg);

static inline void mem_cgroup_enter_user_fault(void)
{
	WARN_ON(current->in_user_fault);
	current->in_user_fault = 1;
}

static inline void mem_cgroup_exit_user_fault(void)
{
	WARN_ON(!current->in_user_fault);
	current->in_user_fault = 0;
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
	return p->memcg_in_oom;
}

bool mem_cgroup_oom_synchronize(bool wait);
struct mem_cgroup *mem_cgroup_get_oom_group(struct task_struct *victim,
					    struct mem_cgroup *oom_domain);
void mem_cgroup_print_oom_group(struct mem_cgroup *memcg);

void folio_memcg_lock(struct folio *folio);
void folio_memcg_unlock(struct folio *folio);
void lock_page_memcg(struct page *page);
void unlock_page_memcg(struct page *page);

void __mod_memcg_state(struct mem_cgroup *memcg, int idx, int val);

/* try to stabilize folio_memcg() for all the pages in a memcg */
static inline bool mem_cgroup_trylock_pages(struct mem_cgroup *memcg)
{
	rcu_read_lock();

	if (mem_cgroup_disabled() || !atomic_read(&memcg->moving_account))
		return true;

	rcu_read_unlock();
	return false;
}

static inline void mem_cgroup_unlock_pages(void)
{
	rcu_read_unlock();
}

/* idx can be of type enum memcg_stat_item or node_stat_item */
static inline void mod_memcg_state(struct mem_cgroup *memcg,
				   int idx, int val)
{
	unsigned long flags;

	local_irq_save(flags);
	__mod_memcg_state(memcg, idx, val);
	local_irq_restore(flags);
}

static inline void mod_memcg_page_state(struct page *page,
					int idx, int val)
{
	struct mem_cgroup *memcg;

	if (mem_cgroup_disabled())
		return;

	rcu_read_lock();
	memcg = page_memcg(page);
	if (memcg)
		mod_memcg_state(memcg, idx, val);
	rcu_read_unlock();
}

unsigned long memcg_page_state(struct mem_cgroup *memcg, int idx);

static inline unsigned long lruvec_page_state(struct lruvec *lruvec,
					      enum node_stat_item idx)
{
	struct mem_cgroup_per_node *pn;
	long x;

	if (mem_cgroup_disabled())
		return node_page_state(lruvec_pgdat(lruvec), idx);

	pn = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	x = READ_ONCE(pn->lruvec_stats.state[idx]);
#ifdef CONFIG_SMP
	if (x < 0)
		x = 0;
#endif
	return x;
}

static inline unsigned long lruvec_page_state_local(struct lruvec *lruvec,
						    enum node_stat_item idx)
{
	struct mem_cgroup_per_node *pn;
	long x = 0;
	int cpu;

	if (mem_cgroup_disabled())
		return node_page_state(lruvec_pgdat(lruvec), idx);

	pn = container_of(lruvec, struct mem_cgroup_per_node, lruvec);
	for_each_possible_cpu(cpu)
		x += per_cpu(pn->lruvec_stats_percpu->state[idx], cpu);
#ifdef CONFIG_SMP
	if (x < 0)
		x = 0;
#endif
	return x;
}

void mem_cgroup_flush_stats(void);
void mem_cgroup_flush_stats_delayed(void);

void __mod_memcg_lruvec_state(struct lruvec *lruvec, enum node_stat_item idx,
			      int val);
void __mod_lruvec_kmem_state(void *p, enum node_stat_item idx, int val);

static inline void mod_lruvec_kmem_state(void *p, enum node_stat_item idx,
					 int val)
{
	unsigned long flags;

	local_irq_save(flags);
	__mod_lruvec_kmem_state(p, idx, val);
	local_irq_restore(flags);
}

static inline void mod_memcg_lruvec_state(struct lruvec *lruvec,
					  enum node_stat_item idx, int val)
{
	unsigned long flags;

	local_irq_save(flags);
	__mod_memcg_lruvec_state(lruvec, idx, val);
	local_irq_restore(flags);
}

void __count_memcg_events(struct mem_cgroup *memcg, enum vm_event_item idx,
			  unsigned long count);

static inline void count_memcg_events(struct mem_cgroup *memcg,
				      enum vm_event_item idx,
				      unsigned long count)
{
	unsigned long flags;

	local_irq_save(flags);
	__count_memcg_events(memcg, idx, count);
	local_irq_restore(flags);
}

static inline void count_memcg_page_event(struct page *page,
					  enum vm_event_item idx)
{
	struct mem_cgroup *memcg = page_memcg(page);

	if (memcg)
		count_memcg_events(memcg, idx, 1);
}

static inline void count_memcg_folio_events(struct folio *folio,
		enum vm_event_item idx, unsigned long nr)
{
	struct mem_cgroup *memcg = folio_memcg(folio);

	if (memcg)
		count_memcg_events(memcg, idx, nr);
}

static inline void count_memcg_event_mm(struct mm_struct *mm,
					enum vm_event_item idx)
{
	struct mem_cgroup *memcg;

	if (mem_cgroup_disabled())
		return;

	rcu_read_lock();
	memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	if (likely(memcg))
		count_memcg_events(memcg, idx, 1);
	rcu_read_unlock();
}

static inline void memcg_memory_event(struct mem_cgroup *memcg,
				      enum memcg_memory_event event)
{
	bool swap_event = event == MEMCG_SWAP_HIGH || event == MEMCG_SWAP_MAX ||
			  event == MEMCG_SWAP_FAIL;

	atomic_long_inc(&memcg->memory_events_local[event]);
	if (!swap_event)
		cgroup_file_notify(&memcg->events_local_file);

	do {
		atomic_long_inc(&memcg->memory_events[event]);
		if (swap_event)
			cgroup_file_notify(&memcg->swap_events_file);
		else
			cgroup_file_notify(&memcg->events_file);

		if (!cgroup_subsys_on_dfl(memory_cgrp_subsys))
			break;
		if (cgrp_dfl_root.flags & CGRP_ROOT_MEMORY_LOCAL_EVENTS)
			break;
	} while ((memcg = parent_mem_cgroup(memcg)) &&
		 !mem_cgroup_is_root(memcg));
}

static inline void memcg_memory_event_mm(struct mm_struct *mm,
					 enum memcg_memory_event event)
{
	struct mem_cgroup *memcg;

	if (mem_cgroup_disabled())
		return;

	rcu_read_lock();
	memcg = mem_cgroup_from_task(rcu_dereference(mm->owner));
	if (likely(memcg))
		memcg_memory_event(memcg, event);
	rcu_read_unlock();
}

void split_page_memcg(struct page *head, unsigned int nr);

unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned);
#else /* CONFIG_MEMCG */

#define MEM_CGROUP_ID_SHIFT	0
#define MEM_CGROUP_ID_MAX	0

static inline struct mem_cgroup *folio_memcg(struct folio *folio)
{
	return NULL;
}

static inline struct mem_cgroup *page_memcg(struct page *page)
{
	return NULL;
}

static inline struct mem_cgroup *folio_memcg_rcu(struct folio *folio)
{
	WARN_ON_ONCE(!rcu_read_lock_held());
	return NULL;
}

static inline struct mem_cgroup *page_memcg_check(struct page *page)
{
	return NULL;
}

static inline bool folio_memcg_kmem(struct folio *folio)
{
	return false;
}

static inline bool PageMemcgKmem(struct page *page)
{
	return false;
}

static inline bool mem_cgroup_is_root(struct mem_cgroup *memcg)
{
	return true;
}

static inline bool mem_cgroup_disabled(void)
{
	return true;
}

static inline void memcg_memory_event(struct mem_cgroup *memcg,
				      enum memcg_memory_event event)
{
}

static inline void memcg_memory_event_mm(struct mm_struct *mm,
					 enum memcg_memory_event event)
{
}

static inline void mem_cgroup_protection(struct mem_cgroup *root,
					 struct mem_cgroup *memcg,
					 unsigned long *min,
					 unsigned long *low)
{
	*min = *low = 0;
}

static inline void mem_cgroup_calculate_protection(struct mem_cgroup *root,
						   struct mem_cgroup *memcg)
{
}

static inline bool mem_cgroup_below_low(struct mem_cgroup *memcg)
{
	return false;
}

static inline bool mem_cgroup_below_min(struct mem_cgroup *memcg)
{
	return false;
}

static inline int mem_cgroup_charge(struct folio *folio,
		struct mm_struct *mm, gfp_t gfp)
{
	return 0;
}

static inline int mem_cgroup_swapin_charge_folio(struct folio *folio,
		struct mm_struct *mm, gfp_t gfp, swp_entry_t entry)
{
	return 0;
}

static inline void mem_cgroup_swapin_uncharge_swap(swp_entry_t entry)
{
}

static inline void mem_cgroup_uncharge(struct folio *folio)
{
}

static inline void mem_cgroup_uncharge_list(struct list_head *page_list)
{
}

static inline void mem_cgroup_migrate(struct folio *old, struct folio *new)
{
}

static inline struct lruvec *mem_cgroup_lruvec(struct mem_cgroup *memcg,
					       struct pglist_data *pgdat)
{
	return &pgdat->__lruvec;
}

static inline struct lruvec *folio_lruvec(struct folio *folio)
{
	struct pglist_data *pgdat = folio_pgdat(folio);
	return &pgdat->__lruvec;
}

static inline
void lruvec_memcg_debug(struct lruvec *lruvec, struct folio *folio)
{
}

static inline struct mem_cgroup *parent_mem_cgroup(struct mem_cgroup *memcg)
{
	return NULL;
}

static inline bool mm_match_cgroup(struct mm_struct *mm,
		struct mem_cgroup *memcg)
{
	return true;
}

static inline struct mem_cgroup *get_mem_cgroup_from_mm(struct mm_struct *mm)
{
	return NULL;
}

static inline
struct mem_cgroup *mem_cgroup_from_css(struct cgroup_subsys_state *css)
{
	return NULL;
}

static inline void obj_cgroup_put(struct obj_cgroup *objcg)
{
}

static inline bool mem_cgroup_tryget(struct mem_cgroup *memcg)
{
	return true;
}

static inline void mem_cgroup_put(struct mem_cgroup *memcg)
{
}

static inline struct lruvec *folio_lruvec_lock(struct folio *folio)
{
	struct pglist_data *pgdat = folio_pgdat(folio);

	spin_lock(&pgdat->__lruvec.lru_lock);
	return &pgdat->__lruvec;
}

static inline struct lruvec *folio_lruvec_lock_irq(struct folio *folio)
{
	struct pglist_data *pgdat = folio_pgdat(folio);

	spin_lock_irq(&pgdat->__lruvec.lru_lock);
	return &pgdat->__lruvec;
}

static inline struct lruvec *folio_lruvec_lock_irqsave(struct folio *folio,
		unsigned long *flagsp)
{
	struct pglist_data *pgdat = folio_pgdat(folio);

	spin_lock_irqsave(&pgdat->__lruvec.lru_lock, *flagsp);
	return &pgdat->__lruvec;
}

static inline struct mem_cgroup *
mem_cgroup_iter(struct mem_cgroup *root,
		struct mem_cgroup *prev,
		struct mem_cgroup_reclaim_cookie *reclaim)
{
	return NULL;
}

static inline void mem_cgroup_iter_break(struct mem_cgroup *root,
					 struct mem_cgroup *prev)
{
}

static inline int mem_cgroup_scan_tasks(struct mem_cgroup *memcg,
		int (*fn)(struct task_struct *, void *), void *arg)
{
	return 0;
}

static inline unsigned short mem_cgroup_id(struct mem_cgroup *memcg)
{
	return 0;
}

static inline struct mem_cgroup *mem_cgroup_from_id(unsigned short id)
{
	WARN_ON_ONCE(id);
	/* XXX: This should always return root_mem_cgroup */
	return NULL;
}

#ifdef CONFIG_SHRINKER_DEBUG
static inline unsigned long mem_cgroup_ino(struct mem_cgroup *memcg)
{
	return 0;
}

static inline struct mem_cgroup *mem_cgroup_get_from_ino(unsigned long ino)
{
	return NULL;
}
#endif

static inline struct mem_cgroup *mem_cgroup_from_seq(struct seq_file *m)
{
	return NULL;
}

static inline struct mem_cgroup *lruvec_memcg(struct lruvec *lruvec)
{
	return NULL;
}

static inline bool mem_cgroup_online(struct mem_cgroup *memcg)
{
	return true;
}

static inline
unsigned long mem_cgroup_get_zone_lru_size(struct lruvec *lruvec,
		enum lru_list lru, int zone_idx)
{
	return 0;
}

static inline unsigned long mem_cgroup_get_max(struct mem_cgroup *memcg)
{
	return 0;
}

static inline unsigned long mem_cgroup_size(struct mem_cgroup *memcg)
{
	return 0;
}

static inline void
mem_cgroup_print_oom_context(struct mem_cgroup *memcg, struct task_struct *p)
{
}

static inline void
mem_cgroup_print_oom_meminfo(struct mem_cgroup *memcg)
{
}

static inline void lock_page_memcg(struct page *page)
{
}

static inline void unlock_page_memcg(struct page *page)
{
}

static inline void folio_memcg_lock(struct folio *folio)
{
}

static inline void folio_memcg_unlock(struct folio *folio)
{
}

static inline bool mem_cgroup_trylock_pages(struct mem_cgroup *memcg)
{
	/* to match folio_memcg_rcu() */
	rcu_read_lock();
	return true;
}

static inline void mem_cgroup_unlock_pages(void)
{
	rcu_read_unlock();
}

static inline void mem_cgroup_handle_over_high(gfp_t gfp_mask)
{
}

static inline void mem_cgroup_enter_user_fault(void)
{
}

static inline void mem_cgroup_exit_user_fault(void)
{
}

static inline bool task_in_memcg_oom(struct task_struct *p)
{
	return false;
}

static inline bool mem_cgroup_oom_synchronize(bool wait)
{
	return false;
}

static inline struct mem_cgroup *mem_cgroup_get_oom_group(
	struct task_struct *victim, struct mem_cgroup *oom_domain)
{
	return NULL;
}

static inline void mem_cgroup_print_oom_group(struct mem_cgroup *memcg)
{
}

static inline void __mod_memcg_state(struct mem_cgroup *memcg,
				     int idx,
				     int nr)
{
}

static inline void mod_memcg_state(struct mem_cgroup *memcg,
				   int idx,
				   int nr)
{
}

static inline void mod_memcg_page_state(struct page *page,
					int idx, int val)
{
}

static inline unsigned long memcg_page_state(struct mem_cgroup *memcg, int idx)
{
	return 0;
}

static inline unsigned long lruvec_page_state(struct lruvec *lruvec,
					      enum node_stat_item idx)
{
	return node_page_state(lruvec_pgdat(lruvec), idx);
}

static inline unsigned long lruvec_page_state_local(struct lruvec *lruvec,
						    enum node_stat_item idx)
{
	return node_page_state(lruvec_pgdat(lruvec), idx);
}

static inline void mem_cgroup_flush_stats(void)
{
}

static inline void mem_cgroup_flush_stats_delayed(void)
{
}

static inline void __mod_memcg_lruvec_state(struct lruvec *lruvec,
					    enum node_stat_item idx, int val)
{
}

static inline void __mod_lruvec_kmem_state(void *p, enum node_stat_item idx,
					   int val)
{
	struct page *page = virt_to_head_page(p);

	__mod_node_page_state(page_pgdat(page), idx, val);
}

static inline void mod_lruvec_kmem_state(void *p, enum node_stat_item idx,
					 int val)
{
	struct page *page = virt_to_head_page(p);

	mod_node_page_state(page_pgdat(page), idx, val);
}

static inline void count_memcg_events(struct mem_cgroup *memcg,
				      enum vm_event_item idx,
				      unsigned long count)
{
}

static inline void __count_memcg_events(struct mem_cgroup *memcg,
					enum vm_event_item idx,
					unsigned long count)
{
}

static inline void count_memcg_page_event(struct page *page,
					  int idx)
{
}

static inline void count_memcg_folio_events(struct folio *folio,
		enum vm_event_item idx, unsigned long nr)
{
}

static inline
void count_memcg_event_mm(struct mm_struct *mm, enum vm_event_item idx)
{
}

static inline void split_page_memcg(struct page *head, unsigned int nr)
{
}

static inline
unsigned long mem_cgroup_soft_limit_reclaim(pg_data_t *pgdat, int order,
					    gfp_t gfp_mask,
					    unsigned long *total_scanned)
{
	return 0;
}
#endif /* CONFIG_MEMCG */
static inline void __inc_lruvec_kmem_state(void *p, enum node_stat_item idx)
{
	__mod_lruvec_kmem_state(p, idx, 1);
}

static inline void __dec_lruvec_kmem_state(void *p, enum node_stat_item idx)
{
	__mod_lruvec_kmem_state(p, idx, -1);
}

static inline struct lruvec *parent_lruvec(struct lruvec *lruvec)
{
	struct mem_cgroup *memcg;

	memcg = lruvec_memcg(lruvec);
	if (!memcg)
		return NULL;
	memcg = parent_mem_cgroup(memcg);
	if (!memcg)
		return NULL;
	return mem_cgroup_lruvec(memcg, lruvec_pgdat(lruvec));
}

static inline void unlock_page_lruvec(struct lruvec *lruvec)
{
	spin_unlock(&lruvec->lru_lock);
}

static inline void unlock_page_lruvec_irq(struct lruvec *lruvec)
{
	spin_unlock_irq(&lruvec->lru_lock);
}

static inline void unlock_page_lruvec_irqrestore(struct lruvec *lruvec,
		unsigned long flags)
{
	spin_unlock_irqrestore(&lruvec->lru_lock, flags);
}

/* Test requires a stable page->memcg binding, see page_memcg() */
static inline bool folio_matches_lruvec(struct folio *folio,
		struct lruvec *lruvec)
{
	return lruvec_pgdat(lruvec) == folio_pgdat(folio) &&
	       lruvec_memcg(lruvec) == folio_memcg(folio);
}

/* Don't lock again iff page's lruvec locked */
static inline struct lruvec *folio_lruvec_relock_irq(struct folio *folio,
		struct lruvec *locked_lruvec)
{
	if (locked_lruvec) {
		if (folio_matches_lruvec(folio, locked_lruvec))
			return locked_lruvec;

		unlock_page_lruvec_irq(locked_lruvec);
	}

	return folio_lruvec_lock_irq(folio);
}

/* Don't lock again iff page's lruvec locked */
static inline struct lruvec *folio_lruvec_relock_irqsave(struct folio *folio,
		struct lruvec *locked_lruvec, unsigned long *flags)
{
	if (locked_lruvec) {
		if (folio_matches_lruvec(folio, locked_lruvec))
			return locked_lruvec;

		unlock_page_lruvec_irqrestore(locked_lruvec, *flags);
	}

	return folio_lruvec_lock_irqsave(folio, flags);
}
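
/*
 * Illustrative only: the relock helpers above exist so that code walking a
 * mixed list of folios only drops and re-takes the lru_lock when the lruvec
 * actually changes. A sketch of the usual pattern, assuming the caller
 * supplies the folio list:
 *
 *	struct lruvec *lruvec = NULL;
 *	unsigned long flags;
 *	struct folio *folio;
 *
 *	list_for_each_entry(folio, folio_list, lru) {
 *		lruvec = folio_lruvec_relock_irqsave(folio, lruvec, &flags);
 *		// ... operate on the folio's LRU state under the lock ...
 *	}
 *	if (lruvec)
 *		unlock_page_lruvec_irqrestore(lruvec, flags);
 */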
#ifdef CONFIG_CGROUP_WRITEBACK

struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb);
void mem_cgroup_wb_stats(struct bdi_writeback *wb, unsigned long *pfilepages,
			 unsigned long *pheadroom, unsigned long *pdirty,
			 unsigned long *pwriteback);

void mem_cgroup_track_foreign_dirty_slowpath(struct folio *folio,
					     struct bdi_writeback *wb);

static inline void mem_cgroup_track_foreign_dirty(struct folio *folio,
						  struct bdi_writeback *wb)
{
	struct mem_cgroup *memcg;

	if (mem_cgroup_disabled())
		return;

	memcg = folio_memcg(folio);
	if (unlikely(memcg && &memcg->css != wb->memcg_css))
		mem_cgroup_track_foreign_dirty_slowpath(folio, wb);
}

void mem_cgroup_flush_foreign(struct bdi_writeback *wb);

#else	/* CONFIG_CGROUP_WRITEBACK */

static inline struct wb_domain *mem_cgroup_wb_domain(struct bdi_writeback *wb)
{
	return NULL;
}

static inline void mem_cgroup_wb_stats(struct bdi_writeback *wb,
				       unsigned long *pfilepages,
				       unsigned long *pheadroom,
				       unsigned long *pdirty,
				       unsigned long *pwriteback)
{
}

static inline void mem_cgroup_track_foreign_dirty(struct folio *folio,
						  struct bdi_writeback *wb)
{
}

static inline void mem_cgroup_flush_foreign(struct bdi_writeback *wb)
{
}

#endif	/* CONFIG_CGROUP_WRITEBACK */

struct sock;
bool mem_cgroup_charge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages,
			     gfp_t gfp_mask);
void mem_cgroup_uncharge_skmem(struct mem_cgroup *memcg, unsigned int nr_pages);
#ifdef CONFIG_MEMCG
extern struct static_key_false memcg_sockets_enabled_key;
#define mem_cgroup_sockets_enabled static_branch_unlikely(&memcg_sockets_enabled_key)
void mem_cgroup_sk_alloc(struct sock *sk);
void mem_cgroup_sk_free(struct sock *sk);
static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
{
	if (!cgroup_subsys_on_dfl(memory_cgrp_subsys))
		return !!memcg->tcpmem_pressure;
	do {
		if (time_before(jiffies, READ_ONCE(memcg->socket_pressure)))
			return true;
	} while ((memcg = parent_mem_cgroup(memcg)));
	return false;
}
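
/*
 * Illustrative only: networking code typically consults this helper through
 * the socket's memcg pointer before deciding to grow buffers, roughly along
 * the lines of the hypothetical, simplified check below. sk->sk_memcg is
 * assumed to have been set up by mem_cgroup_sk_alloc().
 *
 *	static bool sk_memcg_under_pressure(const struct sock *sk)
 *	{
 *		return mem_cgroup_sockets_enabled && sk->sk_memcg &&
 *		       mem_cgroup_under_socket_pressure(sk->sk_memcg);
 *	}
 */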
int alloc_shrinker_info(struct mem_cgroup *memcg);
void free_shrinker_info(struct mem_cgroup *memcg);
void set_shrinker_bit(struct mem_cgroup *memcg, int nid, int shrinker_id);
void reparent_shrinker_deferred(struct mem_cgroup *memcg);
#else
#define mem_cgroup_sockets_enabled 0
static inline void mem_cgroup_sk_alloc(struct sock *sk) { };
static inline void mem_cgroup_sk_free(struct sock *sk) { };

static inline bool mem_cgroup_under_socket_pressure(struct mem_cgroup *memcg)
{
	return false;
}

static inline void set_shrinker_bit(struct mem_cgroup *memcg,
				    int nid, int shrinker_id)
{
}
#endif

#ifdef CONFIG_MEMCG_KMEM
bool mem_cgroup_kmem_disabled(void);
int __memcg_kmem_charge_page(struct page *page, gfp_t gfp, int order);
void __memcg_kmem_uncharge_page(struct page *page, int order);

struct obj_cgroup *get_obj_cgroup_from_current(void);
struct obj_cgroup *get_obj_cgroup_from_page(struct page *page);

int obj_cgroup_charge(struct obj_cgroup *objcg, gfp_t gfp, size_t size);
void obj_cgroup_uncharge(struct obj_cgroup *objcg, size_t size);

extern struct static_key_false memcg_kmem_enabled_key;

static inline bool memcg_kmem_enabled(void)
{
	return static_branch_likely(&memcg_kmem_enabled_key);
}

static inline int memcg_kmem_charge_page(struct page *page, gfp_t gfp,
					 int order)
{
	if (memcg_kmem_enabled())
		return __memcg_kmem_charge_page(page, gfp, order);
	return 0;
}

static inline void memcg_kmem_uncharge_page(struct page *page, int order)
{
	if (memcg_kmem_enabled())
		__memcg_kmem_uncharge_page(page, order);
}
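
/*
 * Illustrative only: most kernel allocations reach these helpers implicitly
 * by passing __GFP_ACCOUNT to the page allocator, which charges and
 * uncharges on the caller's behalf. A sketch of the explicit pairing, for a
 * caller that manages the pages itself (alloc_accounted_pages() is a
 * hypothetical helper, not part of this header):
 *
 *	static struct page *alloc_accounted_pages(gfp_t gfp, int order)
 *	{
 *		struct page *page = alloc_pages(gfp, order);
 *
 *		if (page && memcg_kmem_charge_page(page, gfp, order)) {
 *			__free_pages(page, order);	// charge failed
 *			return NULL;
 *		}
 *		return page;	// pair with memcg_kmem_uncharge_page() on free
 *	}
 */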
/*
 * A helper for accessing memcg's kmem_id, used for getting
 * corresponding LRU lists.
 */
static inline int memcg_kmem_id(struct mem_cgroup *memcg)
{
	return memcg ? memcg->kmemcg_id : -1;
}

struct mem_cgroup *mem_cgroup_from_obj(void *p);
struct mem_cgroup *mem_cgroup_from_slab_obj(void *p);

static inline void count_objcg_event(struct obj_cgroup *objcg,
				     enum vm_event_item idx)
{
	struct mem_cgroup *memcg;

	if (!memcg_kmem_enabled())
		return;

	rcu_read_lock();
	memcg = obj_cgroup_memcg(objcg);
	count_memcg_events(memcg, idx, 1);
	rcu_read_unlock();
}

#else
static inline bool mem_cgroup_kmem_disabled(void)
{
	return true;
}

static inline int memcg_kmem_charge_page(struct page *page, gfp_t gfp,
					 int order)
{
	return 0;
}

static inline void memcg_kmem_uncharge_page(struct page *page, int order)
{
}

static inline int __memcg_kmem_charge_page(struct page *page, gfp_t gfp,
					   int order)
{
	return 0;
}

static inline void __memcg_kmem_uncharge_page(struct page *page, int order)
{
}

static inline struct obj_cgroup *get_obj_cgroup_from_page(struct page *page)
{
	return NULL;
}

static inline bool memcg_kmem_enabled(void)
{
	return false;
}

static inline int memcg_kmem_id(struct mem_cgroup *memcg)
{
	return -1;
}

static inline struct mem_cgroup *mem_cgroup_from_obj(void *p)
{
	return NULL;
}

static inline struct mem_cgroup *mem_cgroup_from_slab_obj(void *p)
{
	return NULL;
}

static inline void count_objcg_event(struct obj_cgroup *objcg,
				     enum vm_event_item idx)
{
}

#endif /* CONFIG_MEMCG_KMEM */

#if defined(CONFIG_MEMCG_KMEM) && defined(CONFIG_ZSWAP)
bool obj_cgroup_may_zswap(struct obj_cgroup *objcg);
void obj_cgroup_charge_zswap(struct obj_cgroup *objcg, size_t size);
void obj_cgroup_uncharge_zswap(struct obj_cgroup *objcg, size_t size);
#else
static inline bool obj_cgroup_may_zswap(struct obj_cgroup *objcg)
{
	return true;
}
static inline void obj_cgroup_charge_zswap(struct obj_cgroup *objcg,
					   size_t size)
{
}
static inline void obj_cgroup_uncharge_zswap(struct obj_cgroup *objcg,
					     size_t size)
{
}
#endif

#endif /* _LINUX_MEMCONTROL_H */