12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883 |
- #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
- #include <linux/mm.h>
- #include <linux/module.h>
- #include <linux/gfp.h>
- #include <linux/kernel_stat.h>
- #include <linux/swap.h>
- #include <linux/pagemap.h>
- #include <linux/init.h>
- #include <linux/highmem.h>
- #include <linux/vmpressure.h>
- #include <linux/vmstat.h>
- #include <linux/file.h>
- #include <linux/writeback.h>
- #include <linux/blkdev.h>
- #include <linux/buffer_head.h> /* for try_to_release_page(),
- buffer_heads_over_limit */
- #include <linux/mm_inline.h>
- #include <linux/backing-dev.h>
- #include <linux/rmap.h>
- #include <linux/topology.h>
- #include <linux/cpu.h>
- #include <linux/cpuset.h>
- #include <linux/compaction.h>
- #include <linux/notifier.h>
- #include <linux/rwsem.h>
- #include <linux/delay.h>
- #include <linux/kthread.h>
- #include <linux/freezer.h>
- #include <linux/memcontrol.h>
- #include <linux/delayacct.h>
- #include <linux/sysctl.h>
- #include <linux/oom.h>
- #include <linux/prefetch.h>
- #include <linux/printk.h>
- #include <linux/dax.h>
- #include <asm/tlbflush.h>
- #include <asm/div64.h>
- #include <linux/swapops.h>
- #include <linux/balloon_compaction.h>
- #include "internal.h"
- #define CREATE_TRACE_POINTS
- #include <trace/events/vmscan.h>
/*
 * struct scan_control - parameters and running totals for one reclaim pass.
 *
 * An instance is passed by pointer through the reclaim helpers in this file.
 * Fields whose use is not visible in this part of the file are marked
 * NOTE(review) and should be confirmed against their users.
 */
- struct scan_control {
- 
/* NOTE(review): presumably the number of pages the caller wants reclaimed — confirm. */
- unsigned long nr_to_reclaim;
- 
/*
 * Allocation context of the caller. shrink_page_list() tests __GFP_FS and
 * __GFP_IO on it to decide whether filesystem / swap I/O may be entered.
 */
- gfp_t gfp_mask;
- 
/* NOTE(review): presumably the allocation order that triggered reclaim — confirm. */
- int order;
- 
/* NOTE(review): presumably restricts which nodes are scanned — confirm. */
- nodemask_t *nodemask;
- 
/*
 * Memory cgroup being reclaimed from. NULL means global reclaim
 * (see global_reclaim()).
 */
- struct mem_cgroup *target_mem_cgroup;
- 
/* NOTE(review): presumably the scan priority level (DEF_PRIORITY is a starting value) — confirm. */
- int priority;
- 
/* NOTE(review): presumably the highest zone index eligible for reclaim — confirm. */
- enum zone_type reclaim_idx;
/* When clear, shrink_page_list() keeps dirty pages instead of calling pageout(). */
- unsigned int may_writepage:1;
- 
/* When clear, shrink_page_list() skips pages that are still mapped. */
- unsigned int may_unmap:1;
- 
/* NOTE(review): presumably allows swapping out anonymous pages — confirm. */
- unsigned int may_swap:1;
- 
/* NOTE(review): not used in the visible code — confirm meaning with its users. */
- unsigned int may_thrash:1;
/* NOTE(review): not used in the visible code — confirm meaning with its users. */
- unsigned int hibernation_mode:1;
- 
/* NOTE(review): not used in the visible code — confirm meaning with its users. */
- unsigned int compaction_ready:1;
- 
/*
 * Incremented by shrink_page_list() for every page it examines (twice for
 * pages that are mapped or in the swap cache).
 */
- unsigned long nr_scanned;
- 
/* NOTE(review): presumably the running count of pages freed so far — confirm. */
- unsigned long nr_reclaimed;
- };
/*
 * prefetch_prev_lru_page - prefetch a field of a neighbouring page on an LRU list.
 * @_page:  page currently being processed (expression of type struct page *)
 * @_base:  head of the list @_page sits on
 * @_field: member of struct page to prefetch for reading
 *
 * When the node before @_page on the list is not the list head, the page
 * obtained from lru_to_page() on @_page's lru node has @_field prefetched.
 * Compiles to nothing on architectures without ARCH_HAS_PREFETCH.
 *
 * Every use of @_page and @_base is parenthesized so that arbitrary
 * expressions (e.g. "p + 1" or "cond ? a : b") expand correctly.
 */
#ifdef ARCH_HAS_PREFETCH
#define prefetch_prev_lru_page(_page, _base, _field)			\
	do {								\
		if ((_page)->lru.prev != (_base)) {			\
			struct page *prev;				\
									\
			prev = lru_to_page(&((_page)->lru));		\
			prefetch(&prev->_field);			\
		}							\
	} while (0)
#else
#define prefetch_prev_lru_page(_page, _base, _field) do { } while (0)
#endif
/*
 * prefetchw_prev_lru_page - write-intent variant of the LRU neighbour prefetch.
 * @_page:  page currently being processed (expression of type struct page *)
 * @_base:  head of the list @_page sits on
 * @_field: member of struct page to prefetch for writing
 *
 * When the node before @_page on the list is not the list head, the page
 * obtained from lru_to_page() on @_page's lru node has @_field prefetched
 * with prefetchw(). Compiles to nothing without ARCH_HAS_PREFETCHW.
 *
 * Every use of @_page and @_base is parenthesized so that arbitrary
 * expressions expand correctly.
 */
#ifdef ARCH_HAS_PREFETCHW
#define prefetchw_prev_lru_page(_page, _base, _field)			\
	do {								\
		if ((_page)->lru.prev != (_base)) {			\
			struct page *prev;				\
									\
			prev = lru_to_page(&((_page)->lru));		\
			prefetchw(&prev->_field);			\
		}							\
	} while (0)
#else
#define prefetchw_prev_lru_page(_page, _base, _field) do { } while (0)
#endif
/*
 * Swappiness tunable, initialised to 60.
 * NOTE(review): not read in the visible code; presumably biases reclaim
 * between anonymous and file pages — confirm against its users.
 */
- int vm_swappiness = 60;
/* NOTE(review): not written in the visible code; presumably a global page total — confirm. */
- unsigned long vm_total_pages;
/* All registered shrinkers; register_shrinker() appends, unregister_shrinker() removes. */
- static LIST_HEAD(shrinker_list);
/*
 * Protects shrinker_list: held for write while (un)registering, and taken
 * for read with a trylock by shrink_slab() while walking the list.
 */
- static DECLARE_RWSEM(shrinker_rwsem);
#ifdef CONFIG_MEMCG
/*
 * global_reclaim - true when the reclaim pass is not targeted at a specific
 * memory cgroup (sc->target_mem_cgroup is NULL).
 */
static bool global_reclaim(struct scan_control *sc)
{
	return sc->target_mem_cgroup == NULL;
}

/*
 * sane_reclaim - report whether this reclaim pass is global, or is a cgroup
 * reclaim running with CONFIG_CGROUP_WRITEBACK on the default hierarchy.
 *
 * shrink_page_list() uses the result to choose between marking a page under
 * writeback for later reclaim and waiting for the writeback to finish.
 */
static bool sane_reclaim(struct scan_control *sc)
{
	if (sc->target_mem_cgroup == NULL)
		return true;

#ifdef CONFIG_CGROUP_WRITEBACK
	return cgroup_subsys_on_dfl(memory_cgrp_subsys);
#else
	return false;
#endif
}
#else
/* Without memory cgroups every reclaim pass is global. */
static bool global_reclaim(struct scan_control *sc)
{
	return true;
}

/* Without memory cgroups every reclaim pass is considered sane. */
static bool sane_reclaim(struct scan_control *sc)
{
	return true;
}
#endif
- unsigned long zone_reclaimable_pages(struct zone *zone)
- {
- unsigned long nr;
- nr = zone_page_state_snapshot(zone, NR_ZONE_INACTIVE_FILE) +
- zone_page_state_snapshot(zone, NR_ZONE_ACTIVE_FILE);
- if (get_nr_swap_pages() > 0)
- nr += zone_page_state_snapshot(zone, NR_ZONE_INACTIVE_ANON) +
- zone_page_state_snapshot(zone, NR_ZONE_ACTIVE_ANON);
- return nr;
- }
- unsigned long pgdat_reclaimable_pages(struct pglist_data *pgdat)
- {
- unsigned long nr;
- nr = node_page_state_snapshot(pgdat, NR_ACTIVE_FILE) +
- node_page_state_snapshot(pgdat, NR_INACTIVE_FILE) +
- node_page_state_snapshot(pgdat, NR_ISOLATED_FILE);
- if (get_nr_swap_pages() > 0)
- nr += node_page_state_snapshot(pgdat, NR_ACTIVE_ANON) +
- node_page_state_snapshot(pgdat, NR_INACTIVE_ANON) +
- node_page_state_snapshot(pgdat, NR_ISOLATED_ANON);
- return nr;
- }
- bool pgdat_reclaimable(struct pglist_data *pgdat)
- {
- return node_page_state_snapshot(pgdat, NR_PAGES_SCANNED) <
- pgdat_reclaimable_pages(pgdat) * 6;
- }
- unsigned long lruvec_lru_size(struct lruvec *lruvec, enum lru_list lru, int zone_idx)
- {
- unsigned long lru_size;
- int zid;
- if (!mem_cgroup_disabled())
- lru_size = mem_cgroup_get_lru_size(lruvec, lru);
- else
- lru_size = node_page_state(lruvec_pgdat(lruvec), NR_LRU_BASE + lru);
- for (zid = zone_idx + 1; zid < MAX_NR_ZONES; zid++) {
- struct zone *zone = &lruvec_pgdat(lruvec)->node_zones[zid];
- unsigned long size;
- if (!managed_zone(zone))
- continue;
- if (!mem_cgroup_disabled())
- size = mem_cgroup_get_zone_lru_size(lruvec, lru, zid);
- else
- size = zone_page_state(&lruvec_pgdat(lruvec)->node_zones[zid],
- NR_ZONE_LRU_BASE + lru);
- lru_size -= min(size, lru_size);
- }
- return lru_size;
- }
- int register_shrinker(struct shrinker *shrinker)
- {
- size_t size = sizeof(*shrinker->nr_deferred);
- if (shrinker->flags & SHRINKER_NUMA_AWARE)
- size *= nr_node_ids;
- shrinker->nr_deferred = kzalloc(size, GFP_KERNEL);
- if (!shrinker->nr_deferred)
- return -ENOMEM;
- down_write(&shrinker_rwsem);
- list_add_tail(&shrinker->list, &shrinker_list);
- up_write(&shrinker_rwsem);
- return 0;
- }
- EXPORT_SYMBOL(register_shrinker);
- void unregister_shrinker(struct shrinker *shrinker)
- {
- down_write(&shrinker_rwsem);
- list_del(&shrinker->list);
- up_write(&shrinker_rwsem);
- kfree(shrinker->nr_deferred);
- }
- EXPORT_SYMBOL(unregister_shrinker);
/* Batch size used when a shrinker does not provide its own (shrinker->batch == 0). */
- #define SHRINK_BATCH 128
/*
 * do_shrink_slab - run a single shrinker for one shrink_control.
 * @shrinkctl:   per-call control block; nid is read, nr_to_scan is written
 * @shrinker:    shrinker to invoke
 * @nr_scanned:  numerator of the pressure ratio supplied by the caller
 * @nr_eligible: denominator of the pressure ratio supplied by the caller
 *
 * Computes how many objects to ask the shrinker to scan from the pressure
 * ratio, the shrinker's freeable object count and any work deferred by
 * earlier calls, then calls scan_objects() in batches. Work that was not
 * done is added back to the per-node nr_deferred counter.
 *
 * Returns the sum of the values returned by scan_objects().
 */
- static unsigned long do_shrink_slab(struct shrink_control *shrinkctl,
- struct shrinker *shrinker,
- unsigned long nr_scanned,
- unsigned long nr_eligible)
- {
- unsigned long freed = 0;
- unsigned long long delta;
- long total_scan;
- long freeable;
- long nr;
- long new_nr;
- int nid = shrinkctl->nid;
- long batch_size = shrinker->batch ? shrinker->batch
- : SHRINK_BATCH;
- long scanned = 0, next_deferred;
/* Nothing to do when the shrinker reports no freeable objects. */
- freeable = shrinker->count_objects(shrinker, shrinkctl);
- if (freeable == 0)
- return 0;
- 
/*
 * Take ownership of the work deferred by previous calls: the counter is
 * atomically read and reset to zero.
 */
- nr = atomic_long_xchg(&shrinker->nr_deferred[nid], 0);
- total_scan = nr;
/* delta = (4 * nr_scanned / seeks) * freeable / (nr_eligible + 1) */
- delta = (4 * nr_scanned) / shrinker->seeks;
- delta *= freeable;
- do_div(delta, nr_eligible + 1);
- total_scan += delta;
/*
 * A negative total means the arithmetic overflowed: log it, scan at most
 * the freeable count, and carry forward only the previously deferred work.
 */
- if (total_scan < 0) {
- pr_err("shrink_slab: %pF negative objects to delete nr=%ld\n",
- shrinker->scan_objects, total_scan);
- total_scan = freeable;
- next_deferred = nr;
- } else
- next_deferred = total_scan;
- 
/*
 * When this call's own pressure is small (under a quarter of the freeable
 * objects), cap the scan at half of them so accumulated deferred work is
 * not discharged all at once.
 */
- if (delta < freeable / 4)
- total_scan = min(total_scan, freeable / 2);
- 
/* Never ask for more than twice the freeable object count. */
- if (total_scan > freeable * 2)
- total_scan = freeable * 2;
- trace_mm_shrink_slab_start(shrinker, shrinkctl, nr,
- nr_scanned, nr_eligible,
- freeable, delta, total_scan);
- 
/*
 * Scan in batch_size chunks. The second condition lets the loop also run
 * when the remaining target covers every freeable object even though it is
 * smaller than one batch.
 */
- while (total_scan >= batch_size ||
- total_scan >= freeable) {
- unsigned long ret;
- unsigned long nr_to_scan = min(batch_size, total_scan);
- shrinkctl->nr_to_scan = nr_to_scan;
- ret = shrinker->scan_objects(shrinker, shrinkctl);
/* SHRINK_STOP ends the loop; this batch is not counted as scanned. */
- if (ret == SHRINK_STOP)
- break;
- freed += ret;
- count_vm_events(SLABS_SCANNED, nr_to_scan);
- total_scan -= nr_to_scan;
- scanned += nr_to_scan;
- cond_resched();
- }
/* Whatever was planned but not scanned becomes deferred work (never negative). */
- if (next_deferred >= scanned)
- next_deferred -= scanned;
- else
- next_deferred = 0;
- 
/*
 * Add the leftover back to the shared counter; other callers may have
 * added to it since it was zeroed above, hence add rather than store.
 */
- if (next_deferred > 0)
- new_nr = atomic_long_add_return(next_deferred,
- &shrinker->nr_deferred[nid]);
- else
- new_nr = atomic_long_read(&shrinker->nr_deferred[nid]);
- trace_mm_shrink_slab_end(shrinker, nid, freed, nr, new_nr, total_scan);
- return freed;
- }
- static unsigned long shrink_slab(gfp_t gfp_mask, int nid,
- struct mem_cgroup *memcg,
- unsigned long nr_scanned,
- unsigned long nr_eligible)
- {
- struct shrinker *shrinker;
- unsigned long freed = 0;
- if (memcg && (!memcg_kmem_enabled() || !mem_cgroup_online(memcg)))
- return 0;
- if (nr_scanned == 0)
- nr_scanned = SWAP_CLUSTER_MAX;
- if (!down_read_trylock(&shrinker_rwsem)) {
-
- freed = 1;
- goto out;
- }
- list_for_each_entry(shrinker, &shrinker_list, list) {
- struct shrink_control sc = {
- .gfp_mask = gfp_mask,
- .nid = nid,
- .memcg = memcg,
- };
-
- if (memcg_kmem_enabled() &&
- !!memcg != !!(shrinker->flags & SHRINKER_MEMCG_AWARE))
- continue;
- if (!(shrinker->flags & SHRINKER_NUMA_AWARE))
- sc.nid = 0;
- freed += do_shrink_slab(&sc, shrinker, nr_scanned, nr_eligible);
- }
- up_read(&shrinker_rwsem);
- out:
- cond_resched();
- return freed;
- }
- void drop_slab_node(int nid)
- {
- unsigned long freed;
- do {
- struct mem_cgroup *memcg = NULL;
- freed = 0;
- do {
- freed += shrink_slab(GFP_KERNEL, nid, memcg,
- 1000, 1000);
- } while ((memcg = mem_cgroup_iter(NULL, memcg, NULL)) != NULL);
- } while (freed > 10);
- }
- void drop_slab(void)
- {
- int nid;
- for_each_online_node(nid)
- drop_slab_node(nid);
- }
/*
 * is_page_cache_freeable - does @page have exactly the expected references?
 *
 * Returns nonzero when the page count, minus the value of
 * page_has_private(), equals 2.
 * NOTE(review): the two remaining references are presumably the page cache's
 * and the caller's — confirm.
 */
static inline int is_page_cache_freeable(struct page *page)
{
	int other_refs = page_count(page) - page_has_private(page);

	return other_refs == 2;
}
- static int may_write_to_inode(struct inode *inode, struct scan_control *sc)
- {
- if (current->flags & PF_SWAPWRITE)
- return 1;
- if (!inode_write_congested(inode))
- return 1;
- if (inode_to_bdi(inode) == current->backing_dev_info)
- return 1;
- return 0;
- }
- static void handle_write_error(struct address_space *mapping,
- struct page *page, int error)
- {
- lock_page(page);
- if (page_mapping(page) == mapping)
- mapping_set_error(mapping, error);
- unlock_page(page);
- }
/* Result codes returned by pageout(). */
- typedef enum {
- 
/* The page could not be written now (not freeable, no mapping, or writes not allowed). */
- PAGE_KEEP,
- 
/* The mapping has no writepage method, or writepage returned AOP_WRITEPAGE_ACTIVATE. */
- PAGE_ACTIVATE,
- 
/* writepage was called for the page; it may still be under writeback. */
- PAGE_SUCCESS,
- 
/* The page is clean: it was not dirty for I/O, or it was an orphan whose buffers were freed. */
- PAGE_CLEAN,
- } pageout_t;
- static pageout_t pageout(struct page *page, struct address_space *mapping,
- struct scan_control *sc)
- {
-
- if (!is_page_cache_freeable(page))
- return PAGE_KEEP;
- if (!mapping) {
-
- if (page_has_private(page)) {
- if (try_to_free_buffers(page)) {
- ClearPageDirty(page);
- pr_info("%s: orphaned page\n", __func__);
- return PAGE_CLEAN;
- }
- }
- return PAGE_KEEP;
- }
- if (mapping->a_ops->writepage == NULL)
- return PAGE_ACTIVATE;
- if (!may_write_to_inode(mapping->host, sc))
- return PAGE_KEEP;
- if (clear_page_dirty_for_io(page)) {
- int res;
- struct writeback_control wbc = {
- .sync_mode = WB_SYNC_NONE,
- .nr_to_write = SWAP_CLUSTER_MAX,
- .range_start = 0,
- .range_end = LLONG_MAX,
- .for_reclaim = 1,
- };
- SetPageReclaim(page);
- res = mapping->a_ops->writepage(page, &wbc);
- if (res < 0)
- handle_write_error(mapping, page, res);
- if (res == AOP_WRITEPAGE_ACTIVATE) {
- ClearPageReclaim(page);
- return PAGE_ACTIVATE;
- }
- if (!PageWriteback(page)) {
-
- ClearPageReclaim(page);
- }
- trace_mm_vmscan_writepage(page);
- inc_node_page_state(page, NR_VMSCAN_WRITE);
- return PAGE_SUCCESS;
- }
- return PAGE_CLEAN;
- }
/*
 * __remove_mapping - detach a locked page from its address space.
 * @mapping:   address space the page belongs to (checked with BUG_ON)
 * @page:      locked page to remove
 * @reclaimed: true when called from reclaim; enables workingset shadow
 *             entries for file pages
 *
 * Returns 1 if the page was removed from the swap cache or page cache, in
 * which case its reference count is left frozen. Returns 0 if the page had
 * references other than the expected two or was dirty; it is then left
 * untouched.
 */
- static int __remove_mapping(struct address_space *mapping, struct page *page,
- bool reclaimed)
- {
- unsigned long flags;
- BUG_ON(!PageLocked(page));
- BUG_ON(mapping != page_mapping(page));
- spin_lock_irqsave(&mapping->tree_lock, flags);
- 
/*
 * NOTE(review): page_ref_freeze(page, 2) is expected to succeed only when
 * the reference count is exactly 2, and to block new references while
 * frozen — confirm against its definition.
 */
- if (!page_ref_freeze(page, 2))
- goto cannot_free;
- 
/* The page was redirtied before the freeze: restore the count and give up. */
- if (unlikely(PageDirty(page))) {
- page_ref_unfreeze(page, 2);
- goto cannot_free;
- }
- if (PageSwapCache(page)) {
/* Swap cache page: read the swap entry out of page_private before deleting. */
- swp_entry_t swap = { .val = page_private(page) };
- mem_cgroup_swapout(page, swap);
- __delete_from_swap_cache(page);
- spin_unlock_irqrestore(&mapping->tree_lock, flags);
- swapcache_free(swap);
- } else {
- void (*freepage)(struct page *);
- void *shadow = NULL;
/* Read the callback while still holding tree_lock; it is called after unlock. */
- freepage = mapping->a_ops->freepage;
- 
/*
 * Record a workingset shadow entry only for reclaimed file pages of a
 * mapping that is neither exiting nor DAX.
 */
- if (reclaimed && page_is_file_cache(page) &&
- !mapping_exiting(mapping) && !dax_mapping(mapping))
- shadow = workingset_eviction(mapping, page);
- __delete_from_page_cache(page, shadow);
- spin_unlock_irqrestore(&mapping->tree_lock, flags);
- if (freepage != NULL)
- freepage(page);
- }
- return 1;
- cannot_free:
- spin_unlock_irqrestore(&mapping->tree_lock, flags);
- return 0;
- }
- int remove_mapping(struct address_space *mapping, struct page *page)
- {
- if (__remove_mapping(mapping, page, false)) {
-
- page_ref_unfreeze(page, 1);
- return 1;
- }
- return 0;
- }
/*
 * putback_lru_page - return an isolated page to an LRU list.
 * @page: page that is currently off the LRU (asserted with VM_BUG_ON_PAGE)
 *
 * The page is added to the normal LRU if page_evictable() says so, otherwise
 * to the unevictable list. The evictability is re-checked after adding to
 * the unevictable list, and the placement retried if it changed. One page
 * reference is dropped before returning.
 */
- void putback_lru_page(struct page *page)
- {
- bool is_unevictable;
/* Remember the state on entry so the rescued/culled events can be counted. */
- int was_unevictable = PageUnevictable(page);
- VM_BUG_ON_PAGE(PageLRU(page), page);
- redo:
- ClearPageUnevictable(page);
- if (page_evictable(page)) {
- 
- is_unevictable = false;
- lru_cache_add(page);
- } else {
- 
- is_unevictable = true;
- add_page_to_unevictable_list(page);
- 
/*
 * NOTE(review): the barrier presumably orders the list insertion against
 * the page_evictable() re-check below — confirm the pairing barrier.
 */
- smp_mb();
- }
- 
/*
 * The page may have become evictable while it was being put on the
 * unevictable list. If so, take it back off the LRU and redo the placement;
 * put_page() drops the reference taken by the successful isolate_lru_page().
 */
- if (is_unevictable && page_evictable(page)) {
- if (!isolate_lru_page(page)) {
- put_page(page);
- goto redo;
- }
- 
- }
- if (was_unevictable && !is_unevictable)
- count_vm_event(UNEVICTABLE_PGRESCUED);
- else if (!was_unevictable && is_unevictable)
- count_vm_event(UNEVICTABLE_PGCULLED);
/* Drop one reference on the page. NOTE(review): presumably the isolation reference — confirm. */
- put_page(page);
- }
/* Verdicts returned by page_check_references() and acted on by shrink_page_list(). */
- enum page_references {
/* Proceed with reclaim, including writing the page out if it is dirty. */
- PAGEREF_RECLAIM,
/* Proceed with reclaim only if the page is clean; dirty pages are kept. */
- PAGEREF_RECLAIM_CLEAN,
/* Leave the page where it is for now. */
- PAGEREF_KEEP,
/* Mark the page active. */
- PAGEREF_ACTIVATE,
- };
- static enum page_references page_check_references(struct page *page,
- struct scan_control *sc)
- {
- int referenced_ptes, referenced_page;
- unsigned long vm_flags;
- referenced_ptes = page_referenced(page, 1, sc->target_mem_cgroup,
- &vm_flags);
- referenced_page = TestClearPageReferenced(page);
-
- if (vm_flags & VM_LOCKED)
- return PAGEREF_RECLAIM;
- if (referenced_ptes) {
- if (PageSwapBacked(page))
- return PAGEREF_ACTIVATE;
-
- SetPageReferenced(page);
- if (referenced_page || referenced_ptes > 1)
- return PAGEREF_ACTIVATE;
-
- if (vm_flags & VM_EXEC)
- return PAGEREF_ACTIVATE;
- return PAGEREF_KEEP;
- }
-
- if (referenced_page && !PageSwapBacked(page))
- return PAGEREF_RECLAIM_CLEAN;
- return PAGEREF_RECLAIM;
- }
- static void page_check_dirty_writeback(struct page *page,
- bool *dirty, bool *writeback)
- {
- struct address_space *mapping;
-
- if (!page_is_file_cache(page)) {
- *dirty = false;
- *writeback = false;
- return;
- }
-
- *dirty = PageDirty(page);
- *writeback = PageWriteback(page);
-
- if (!page_has_private(page))
- return;
- mapping = page_mapping(page);
- if (mapping && mapping->a_ops->is_dirty_writeback)
- mapping->a_ops->is_dirty_writeback(page, dirty, writeback);
- }
/*
 * shrink_page_list - try to reclaim every page on an isolated page list.
 * @page_list:             pages to process; on return it holds the pages
 *                         that were not freed
 * @pgdat:                 node whose PGDAT_WRITEBACK / PGDAT_DIRTY flags are
 *                         consulted
 * @sc:                    scan control; gfp_mask, may_unmap and may_writepage
 *                         are read, nr_scanned is incremented
 * @ttu_flags:             base flags for try_to_unmap()
 * @ret_nr_dirty:          incremented by the number of dirty or writeback pages
 * @ret_nr_unqueued_dirty: incremented by the number of dirty pages not under
 *                         writeback
 * @ret_nr_congested:      incremented by the number of pages counted as congested
 * @ret_nr_writeback:      incremented by the number of writeback pages marked
 *                         for reclaim
 * @ret_nr_immediate:      incremented by the number of pages kswapd found
 *                         still under writeback after being marked for reclaim
 * @force_reclaim:         when true, page_check_references() is skipped and
 *                         every page is treated as PAGEREF_RECLAIM_CLEAN
 *
 * Pages are taken off @page_list one by one. Freed pages are collected on a
 * local list and released in one batch at the end; all other pages are
 * collected on a second local list and spliced back onto @page_list.
 *
 * Returns the number of pages reclaimed.
 */
- static unsigned long shrink_page_list(struct list_head *page_list,
- struct pglist_data *pgdat,
- struct scan_control *sc,
- enum ttu_flags ttu_flags,
- unsigned long *ret_nr_dirty,
- unsigned long *ret_nr_unqueued_dirty,
- unsigned long *ret_nr_congested,
- unsigned long *ret_nr_writeback,
- unsigned long *ret_nr_immediate,
- bool force_reclaim)
- {
/* ret_pages: pages handed back to the caller; free_pages: pages to be freed. */
- LIST_HEAD(ret_pages);
- LIST_HEAD(free_pages);
- int pgactivate = 0;
- unsigned long nr_unqueued_dirty = 0;
- unsigned long nr_dirty = 0;
- unsigned long nr_congested = 0;
- unsigned long nr_reclaimed = 0;
- unsigned long nr_writeback = 0;
- unsigned long nr_immediate = 0;
- cond_resched();
- while (!list_empty(page_list)) {
- struct address_space *mapping;
- struct page *page;
- int may_enter_fs;
- enum page_references references = PAGEREF_RECLAIM_CLEAN;
- bool dirty, writeback;
- bool lazyfree = false;
- int ret = SWAP_SUCCESS;
- cond_resched();
- page = lru_to_page(page_list);
- list_del(&page->lru);
/* Never sleep on the page lock: a page locked by someone else is simply kept. */
- if (!trylock_page(page))
- goto keep;
- VM_BUG_ON_PAGE(PageActive(page), page);
- sc->nr_scanned++;
- if (unlikely(!page_evictable(page)))
- goto cull_mlocked;
- if (!sc->may_unmap && page_mapped(page))
- goto keep_locked;
- 
/* Mapped and swap cache pages are counted twice in nr_scanned. */
- if (page_mapped(page) || PageSwapCache(page))
- sc->nr_scanned++;
/* Filesystem entry is allowed with __GFP_FS, or for swap cache pages with __GFP_IO. */
- may_enter_fs = (sc->gfp_mask & __GFP_FS) ||
- (PageSwapCache(page) && (sc->gfp_mask & __GFP_IO));
- 
/* Gather the dirty / writeback statistics reported back to the caller. */
- page_check_dirty_writeback(page, &dirty, &writeback);
- if (dirty || writeback)
- nr_dirty++;
- if (dirty && !writeback)
- nr_unqueued_dirty++;
- 
/*
 * Count the page as congested when its inode is write-congested, or when it
 * is under writeback and already marked for reclaim.
 */
- mapping = page_mapping(page);
- if (((dirty || writeback) && mapping &&
- inode_write_congested(mapping->host)) ||
- (writeback && PageReclaim(page)))
- nr_congested++;
- 
/* Pages under writeback are handled in one of three ways. */
- if (PageWriteback(page)) {
- 
/* Case 1: kswapd sees a reclaim-marked page again on a node flagged PGDAT_WRITEBACK. */
- if (current_is_kswapd() &&
- PageReclaim(page) &&
- test_bit(PGDAT_WRITEBACK, &pgdat->flags)) {
- nr_immediate++;
- goto keep_locked;
- 
/*
 * Case 2: sane reclaim, a page not yet marked for reclaim, or a context that
 * may not enter the filesystem: mark the page and move on.
 */
- } else if (sane_reclaim(sc) ||
- !PageReclaim(page) || !may_enter_fs) {
- 
- SetPageReclaim(page);
- nr_writeback++;
- goto keep_locked;
- 
/* Case 3: wait for the writeback, then requeue the page for another look. */
- } else {
- unlock_page(page);
- wait_on_page_writeback(page);
- 
- list_add_tail(&page->lru, page_list);
- continue;
- }
- }
- if (!force_reclaim)
- references = page_check_references(page, sc);
- switch (references) {
- case PAGEREF_ACTIVATE:
- goto activate_locked;
- case PAGEREF_KEEP:
- goto keep_locked;
- case PAGEREF_RECLAIM:
- case PAGEREF_RECLAIM_CLEAN:
/* Both reclaim verdicts continue below. */
- ;
- }
- 
/* Anonymous pages need swap space (and __GFP_IO) before they can be reclaimed. */
- if (PageAnon(page) && !PageSwapCache(page)) {
- if (!(sc->gfp_mask & __GFP_IO))
- goto keep_locked;
- if (!add_to_swap(page, page_list))
- goto activate_locked;
- lazyfree = true;
- may_enter_fs = 1;
- 
/* add_to_swap() succeeded, so look the mapping up again. */
- mapping = page_mapping(page);
- } else if (unlikely(PageTransHuge(page))) {
- 
/* A non-zero return from the split means the huge page is kept as is. */
- if (split_huge_page_to_list(page, page_list))
- goto keep_locked;
- }
- VM_BUG_ON_PAGE(PageTransHuge(page), page);
- 
/* Unmap the page from all page tables; TTU_LZFREE is added for freshly swapped anon pages. */
- if (page_mapped(page) && mapping) {
- switch (ret = try_to_unmap(page, lazyfree ?
- (ttu_flags | TTU_BATCH_FLUSH | TTU_LZFREE) :
- (ttu_flags | TTU_BATCH_FLUSH))) {
- case SWAP_FAIL:
- goto activate_locked;
- case SWAP_AGAIN:
- goto keep_locked;
- case SWAP_MLOCK:
- goto cull_mlocked;
- case SWAP_LZFREE:
- goto lazyfree;
- case SWAP_SUCCESS:
- ;
- }
- }
- if (PageDirty(page)) {
- 
/*
 * Dirty file pages are written here only by kswapd on a node flagged
 * PGDAT_DIRTY; otherwise they are marked for reclaim and kept.
 */
- if (page_is_file_cache(page) &&
- (!current_is_kswapd() ||
- !test_bit(PGDAT_DIRTY, &pgdat->flags))) {
- 
- inc_node_page_state(page, NR_VMSCAN_IMMEDIATE);
- SetPageReclaim(page);
- goto keep_locked;
- }
- if (references == PAGEREF_RECLAIM_CLEAN)
- goto keep_locked;
- if (!may_enter_fs)
- goto keep_locked;
- if (!sc->may_writepage)
- goto keep_locked;
- 
/* Flush batched TLB invalidations for dirty mappings before starting the write. */
- try_to_unmap_flush_dirty();
- switch (pageout(page, mapping, sc)) {
- case PAGE_KEEP:
- goto keep_locked;
- case PAGE_ACTIVATE:
- goto activate_locked;
- case PAGE_SUCCESS:
- if (PageWriteback(page))
- goto keep;
- if (PageDirty(page))
- goto keep;
- 
/*
 * The write already completed. The code re-takes the page lock here, so
 * writepage presumably returned with the page unlocked (NOTE(review):
 * confirm). State is re-checked under the lock, then control falls
 * through to the PAGE_CLEAN case.
 */
- if (!trylock_page(page))
- goto keep;
- if (PageDirty(page) || PageWriteback(page))
- goto keep_locked;
- mapping = page_mapping(page);
- case PAGE_CLEAN:
- ;
- }
- }
- 
/* Buffers attached to the page must be released before it can be freed. */
- if (page_has_private(page)) {
- if (!try_to_release_page(page, sc->gfp_mask))
- goto activate_locked;
/*
 * Page without a mapping whose only reference is ours: drop that reference
 * directly. If someone else freed it in the meantime it still counts as
 * reclaimed.
 */
- if (!mapping && page_count(page) == 1) {
- unlock_page(page);
- if (put_page_testzero(page))
- goto free_it;
- else {
- 
- nr_reclaimed++;
- continue;
- }
- }
- }
- lazyfree:
- if (!mapping || !__remove_mapping(mapping, page, true))
- goto keep_locked;
- 
/* Non-atomic unlock. NOTE(review): presumably safe because no other reference to the page remains — confirm. */
- __ClearPageLocked(page);
- free_it:
- if (ret == SWAP_LZFREE)
- count_vm_event(PGLAZYFREED);
- nr_reclaimed++;
- 
/* Queue the page for the batched free after the loop. */
- list_add(&page->lru, &free_pages);
- continue;
/* Unevictable page: release any swap slot and hand it back to the caller. */
- cull_mlocked:
- if (PageSwapCache(page))
- try_to_free_swap(page);
- unlock_page(page);
- list_add(&page->lru, &ret_pages);
- continue;
- activate_locked:
- 
/* Do not hold on to swap space for an activated page when swap is full. */
- if (PageSwapCache(page) && mem_cgroup_swap_full(page))
- try_to_free_swap(page);
- VM_BUG_ON_PAGE(PageActive(page), page);
- SetPageActive(page);
- pgactivate++;
- keep_locked:
- unlock_page(page);
- keep:
- list_add(&page->lru, &ret_pages);
- VM_BUG_ON_PAGE(PageLRU(page) || PageUnevictable(page), page);
- }
/* Uncharge, flush pending TLB invalidations, then free all reclaimed pages at once. */
- mem_cgroup_uncharge_list(&free_pages);
- try_to_unmap_flush();
- free_hot_cold_page_list(&free_pages, true);
/* Hand the surviving pages back through @page_list. */
- list_splice(&ret_pages, page_list);
- count_vm_events(PGACTIVATE, pgactivate);
/* The out-parameters are accumulated into, not overwritten. */
- *ret_nr_dirty += nr_dirty;
- *ret_nr_congested += nr_congested;
- *ret_nr_unqueued_dirty += nr_unqueued_dirty;
- *ret_nr_writeback += nr_writeback;
- *ret_nr_immediate += nr_immediate;
- return nr_reclaimed;
- }
- unsigned long reclaim_clean_pages_from_list(struct zone *zone,
- struct list_head *page_list)
- {
- struct scan_control sc = {
- .gfp_mask = GFP_KERNEL,
- .priority = DEF_PRIORITY,
- .may_unmap = 1,
- };
- unsigned long ret, dummy1, dummy2, dummy3, dummy4, dummy5;
- struct page *page, *next;
- LIST_HEAD(clean_pages);
- list_for_each_entry_safe(page, next, page_list, lru) {
- if (page_is_file_cache(page) && !PageDirty(page) &&
- !__PageMovable(page)) {
- ClearPageActive(page);
- list_move(&page->lru, &clean_pages);
- }
- }
- ret = shrink_page_list(&clean_pages, zone->zone_pgdat, &sc,
- TTU_UNMAP|TTU_IGNORE_ACCESS,
- &dummy1, &dummy2, &dummy3, &dummy4, &dummy5, true);
- list_splice(&clean_pages, page_list);
- mod_node_page_state(zone->zone_pgdat, NR_ISOLATED_FILE, -ret);
- return ret;
- }
- int __isolate_lru_page(struct page *page, isolate_mode_t mode)
- {
- int ret = -EINVAL;
-
- if (!PageLRU(page))
- return ret;
-
- if (PageUnevictable(page) && !(mode & ISOLATE_UNEVICTABLE))
- return ret;
- ret = -EBUSY;
-
- if (mode & (ISOLATE_CLEAN|ISOLATE_ASYNC_MIGRATE)) {
-
- if (PageWriteback(page))
- return ret;
- if (PageDirty(page)) {
- struct address_space *mapping;
-
- if (mode & ISOLATE_CLEAN)
- return ret;
-
- mapping = page_mapping(page);
- if (mapping && !mapping->a_ops->migratepage)
- return ret;
- }
- }
- if ((mode & ISOLATE_UNMAPPED) && page_mapped(page))
- return ret;
- if (likely(get_page_unless_zero(page))) {
-
- ClearPageLRU(page);
- ret = 0;
- }
- return ret;
- }
- static __always_inline void update_lru_sizes(struct lruvec *lruvec,
- enum lru_list lru, unsigned long *nr_zone_taken)
- {
- int zid;
- for (zid = 0; zid < MAX_NR_ZONES; zid++) {
- if (!nr_zone_taken[zid])
- continue;
- __update_lru_size(lruvec, lru, zid, -nr_zone_taken[zid]);
- #ifdef CONFIG_MEMCG
- mem_cgroup_update_lru_size(lruvec, lru, zid, -nr_zone_taken[zid]);
- #endif
- }
- }
- static unsigned long isolate_lru_pages(unsigned long nr_to_scan,
- struct lruvec *lruvec, struct list_head *dst,
- unsigned long *nr_scanned, struct scan_control *sc,
- isolate_mode_t mode, enum lru_list lru)
- {
- struct list_head *src = &lruvec->lists[lru];
- unsigned long nr_taken = 0;
- unsigned long nr_zone_taken[MAX_NR_ZONES] = { 0 };
- unsigned long nr_skipped[MAX_NR_ZONES] = { 0, };
- unsigned long scan, nr_pages;
- LIST_HEAD(pages_skipped);
- for (scan = 0; scan < nr_to_scan && nr_taken < nr_to_scan &&
- !list_empty(src);) {
- struct page *page;
- page = lru_to_page(src);
- prefetchw_prev_lru_page(page, src, flags);
- VM_BUG_ON_PAGE(!PageLRU(page), page);
- if (page_zonenum(page) > sc->reclaim_idx) {
- list_move(&page->lru, &pages_skipped);
- nr_skipped[page_zonenum(page)]++;
- continue;
- }
-
- scan++;
- switch (__isolate_lru_page(page, mode)) {
- case 0:
- nr_pages = hpage_nr_pages(page);
- nr_taken += nr_pages;
- nr_zone_taken[page_zonenum(page)] += nr_pages;
- list_move(&page->lru, dst);
- break;
- case -EBUSY:
-
- list_move(&page->lru, src);
- continue;
- default:
- BUG();
- }
- }
-
- if (!list_empty(&pages_skipped)) {
- int zid;
- unsigned long total_skipped = 0;
- for (zid = 0; zid < MAX_NR_ZONES; zid++) {
- if (!nr_skipped[zid])
- continue;
- __count_zid_vm_events(PGSCAN_SKIP, zid, nr_skipped[zid]);
- total_skipped += nr_skipped[zid];
- }
-
- scan += list_empty(src) ? total_skipped : total_skipped >> 2;
- list_splice(&pages_skipped, src);
- }
- *nr_scanned = scan;
- trace_mm_vmscan_lru_isolate(sc->reclaim_idx, sc->order, nr_to_scan, scan,
- nr_taken, mode, is_file_lru(lru));
- update_lru_sizes(lruvec, lru, nr_zone_taken);
- return nr_taken;
- }
- int isolate_lru_page(struct page *page)
- {
- int ret = -EBUSY;
- VM_BUG_ON_PAGE(!page_count(page), page);
- WARN_RATELIMIT(PageTail(page), "trying to isolate tail page");
- if (PageLRU(page)) {
- struct zone *zone = page_zone(page);
- struct lruvec *lruvec;
- spin_lock_irq(zone_lru_lock(zone));
- lruvec = mem_cgroup_page_lruvec(page, zone->zone_pgdat);
- if (PageLRU(page)) {
- int lru = page_lru(page);
- get_page(page);
- ClearPageLRU(page);
- del_page_from_lru_list(page, lruvec, lru);
- ret = 0;
- }
- spin_unlock_irq(zone_lru_lock(zone));
- }
- return ret;
- }
- static int too_many_isolated(struct pglist_data *pgdat, int file,
- struct scan_control *sc)
- {
- unsigned long inactive, isolated;
- if (current_is_kswapd())
- return 0;
- if (!sane_reclaim(sc))
- return 0;
- if (file) {
- inactive = node_page_state(pgdat, NR_INACTIVE_FILE);
- isolated = node_page_state(pgdat, NR_ISOLATED_FILE);
- } else {
- inactive = node_page_state(pgdat, NR_INACTIVE_ANON);
- isolated = node_page_state(pgdat, NR_ISOLATED_ANON);
- }
-
- if ((sc->gfp_mask & (__GFP_IO | __GFP_FS)) == (__GFP_IO | __GFP_FS))
- inactive >>= 3;
- return isolated > inactive;
- }
- static noinline_for_stack void
- putback_inactive_pages(struct lruvec *lruvec, struct list_head *page_list)
- {
- struct zone_reclaim_stat *reclaim_stat = &lruvec->reclaim_stat;
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- LIST_HEAD(pages_to_free);
-
- while (!list_empty(page_list)) {
- struct page *page = lru_to_page(page_list);
- int lru;
- VM_BUG_ON_PAGE(PageLRU(page), page);
- list_del(&page->lru);
- if (unlikely(!page_evictable(page))) {
- spin_unlock_irq(&pgdat->lru_lock);
- putback_lru_page(page);
- spin_lock_irq(&pgdat->lru_lock);
- continue;
- }
- lruvec = mem_cgroup_page_lruvec(page, pgdat);
- SetPageLRU(page);
- lru = page_lru(page);
- add_page_to_lru_list(page, lruvec, lru);
- if (is_active_lru(lru)) {
- int file = is_file_lru(lru);
- int numpages = hpage_nr_pages(page);
- reclaim_stat->recent_rotated[file] += numpages;
- }
- if (put_page_testzero(page)) {
- __ClearPageLRU(page);
- __ClearPageActive(page);
- del_page_from_lru_list(page, lruvec, lru);
- if (unlikely(PageCompound(page))) {
- spin_unlock_irq(&pgdat->lru_lock);
- mem_cgroup_uncharge(page);
- (*get_compound_page_dtor(page))(page);
- spin_lock_irq(&pgdat->lru_lock);
- } else
- list_add(&page->lru, &pages_to_free);
- }
- }
-
- list_splice(&pages_to_free, page_list);
- }
- static int current_may_throttle(void)
- {
- return !(current->flags & PF_LESS_THROTTLE) ||
- current->backing_dev_info == NULL ||
- bdi_write_congested(current->backing_dev_info);
- }
- static bool inactive_reclaimable_pages(struct lruvec *lruvec,
- struct scan_control *sc, enum lru_list lru)
- {
- int zid;
- struct zone *zone;
- int file = is_file_lru(lru);
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- if (!global_reclaim(sc))
- return true;
- for (zid = sc->reclaim_idx; zid >= 0; zid--) {
- zone = &pgdat->node_zones[zid];
- if (!managed_zone(zone))
- continue;
- if (zone_page_state_snapshot(zone, NR_ZONE_LRU_BASE +
- LRU_FILE * file) >= SWAP_CLUSTER_MAX)
- return true;
- }
- return false;
- }
- static noinline_for_stack unsigned long
- shrink_inactive_list(unsigned long nr_to_scan, struct lruvec *lruvec,
- struct scan_control *sc, enum lru_list lru)
- {
- LIST_HEAD(page_list);
- unsigned long nr_scanned;
- unsigned long nr_reclaimed = 0;
- unsigned long nr_taken;
- unsigned long nr_dirty = 0;
- unsigned long nr_congested = 0;
- unsigned long nr_unqueued_dirty = 0;
- unsigned long nr_writeback = 0;
- unsigned long nr_immediate = 0;
- isolate_mode_t isolate_mode = 0;
- int file = is_file_lru(lru);
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- struct zone_reclaim_stat *reclaim_stat = &lruvec->reclaim_stat;
- if (!inactive_reclaimable_pages(lruvec, sc, lru))
- return 0;
- while (unlikely(too_many_isolated(pgdat, file, sc))) {
- congestion_wait(BLK_RW_ASYNC, HZ/10);
-
- if (fatal_signal_pending(current))
- return SWAP_CLUSTER_MAX;
- }
- lru_add_drain();
- if (!sc->may_unmap)
- isolate_mode |= ISOLATE_UNMAPPED;
- if (!sc->may_writepage)
- isolate_mode |= ISOLATE_CLEAN;
- spin_lock_irq(&pgdat->lru_lock);
- nr_taken = isolate_lru_pages(nr_to_scan, lruvec, &page_list,
- &nr_scanned, sc, isolate_mode, lru);
- __mod_node_page_state(pgdat, NR_ISOLATED_ANON + file, nr_taken);
- reclaim_stat->recent_scanned[file] += nr_taken;
- if (global_reclaim(sc)) {
- __mod_node_page_state(pgdat, NR_PAGES_SCANNED, nr_scanned);
- if (current_is_kswapd())
- __count_vm_events(PGSCAN_KSWAPD, nr_scanned);
- else
- __count_vm_events(PGSCAN_DIRECT, nr_scanned);
- }
- spin_unlock_irq(&pgdat->lru_lock);
- if (nr_taken == 0)
- return 0;
- nr_reclaimed = shrink_page_list(&page_list, pgdat, sc, TTU_UNMAP,
- &nr_dirty, &nr_unqueued_dirty, &nr_congested,
- &nr_writeback, &nr_immediate,
- false);
- spin_lock_irq(&pgdat->lru_lock);
- if (global_reclaim(sc)) {
- if (current_is_kswapd())
- __count_vm_events(PGSTEAL_KSWAPD, nr_reclaimed);
- else
- __count_vm_events(PGSTEAL_DIRECT, nr_reclaimed);
- }
- putback_inactive_pages(lruvec, &page_list);
- __mod_node_page_state(pgdat, NR_ISOLATED_ANON + file, -nr_taken);
- spin_unlock_irq(&pgdat->lru_lock);
- mem_cgroup_uncharge_list(&page_list);
- free_hot_cold_page_list(&page_list, true);
-
- if (nr_writeback && nr_writeback == nr_taken)
- set_bit(PGDAT_WRITEBACK, &pgdat->flags);
-
- if (sane_reclaim(sc)) {
-
- if (nr_dirty && nr_dirty == nr_congested)
- set_bit(PGDAT_CONGESTED, &pgdat->flags);
-
- if (nr_unqueued_dirty == nr_taken)
- set_bit(PGDAT_DIRTY, &pgdat->flags);
-
- if (nr_immediate && current_may_throttle())
- congestion_wait(BLK_RW_ASYNC, HZ/10);
- }
-
- if (!sc->hibernation_mode && !current_is_kswapd() &&
- current_may_throttle())
- wait_iff_congested(pgdat, BLK_RW_ASYNC, HZ/10);
- trace_mm_vmscan_lru_shrink_inactive(pgdat->node_id,
- nr_scanned, nr_reclaimed,
- sc->priority, file);
- return nr_reclaimed;
- }
- static void move_active_pages_to_lru(struct lruvec *lruvec,
- struct list_head *list,
- struct list_head *pages_to_free,
- enum lru_list lru)
- {
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- unsigned long pgmoved = 0;
- struct page *page;
- int nr_pages;
- while (!list_empty(list)) {
- page = lru_to_page(list);
- lruvec = mem_cgroup_page_lruvec(page, pgdat);
- VM_BUG_ON_PAGE(PageLRU(page), page);
- SetPageLRU(page);
- nr_pages = hpage_nr_pages(page);
- update_lru_size(lruvec, lru, page_zonenum(page), nr_pages);
- list_move(&page->lru, &lruvec->lists[lru]);
- pgmoved += nr_pages;
- if (put_page_testzero(page)) {
- __ClearPageLRU(page);
- __ClearPageActive(page);
- del_page_from_lru_list(page, lruvec, lru);
- if (unlikely(PageCompound(page))) {
- spin_unlock_irq(&pgdat->lru_lock);
- mem_cgroup_uncharge(page);
- (*get_compound_page_dtor(page))(page);
- spin_lock_irq(&pgdat->lru_lock);
- } else
- list_add(&page->lru, pages_to_free);
- }
- }
- if (!is_active_lru(lru))
- __count_vm_events(PGDEACTIVATE, pgmoved);
- }
- static void shrink_active_list(unsigned long nr_to_scan,
- struct lruvec *lruvec,
- struct scan_control *sc,
- enum lru_list lru)
- {
- unsigned long nr_taken;
- unsigned long nr_scanned;
- unsigned long vm_flags;
- LIST_HEAD(l_hold);
- LIST_HEAD(l_active);
- LIST_HEAD(l_inactive);
- struct page *page;
- struct zone_reclaim_stat *reclaim_stat = &lruvec->reclaim_stat;
- unsigned long nr_rotated = 0;
- isolate_mode_t isolate_mode = 0;
- int file = is_file_lru(lru);
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- lru_add_drain();
- if (!sc->may_unmap)
- isolate_mode |= ISOLATE_UNMAPPED;
- if (!sc->may_writepage)
- isolate_mode |= ISOLATE_CLEAN;
- spin_lock_irq(&pgdat->lru_lock);
- nr_taken = isolate_lru_pages(nr_to_scan, lruvec, &l_hold,
- &nr_scanned, sc, isolate_mode, lru);
- __mod_node_page_state(pgdat, NR_ISOLATED_ANON + file, nr_taken);
- reclaim_stat->recent_scanned[file] += nr_taken;
- if (global_reclaim(sc))
- __mod_node_page_state(pgdat, NR_PAGES_SCANNED, nr_scanned);
- __count_vm_events(PGREFILL, nr_scanned);
- spin_unlock_irq(&pgdat->lru_lock);
- while (!list_empty(&l_hold)) {
- cond_resched();
- page = lru_to_page(&l_hold);
- list_del(&page->lru);
- if (unlikely(!page_evictable(page))) {
- putback_lru_page(page);
- continue;
- }
- if (unlikely(buffer_heads_over_limit)) {
- if (page_has_private(page) && trylock_page(page)) {
- if (page_has_private(page))
- try_to_release_page(page, 0);
- unlock_page(page);
- }
- }
- if (page_referenced(page, 0, sc->target_mem_cgroup,
- &vm_flags)) {
- nr_rotated += hpage_nr_pages(page);
-
- if ((vm_flags & VM_EXEC) && page_is_file_cache(page)) {
- list_add(&page->lru, &l_active);
- continue;
- }
- }
- ClearPageActive(page);
- list_add(&page->lru, &l_inactive);
- }
-
- spin_lock_irq(&pgdat->lru_lock);
-
- reclaim_stat->recent_rotated[file] += nr_rotated;
- move_active_pages_to_lru(lruvec, &l_active, &l_hold, lru);
- move_active_pages_to_lru(lruvec, &l_inactive, &l_hold, lru - LRU_ACTIVE);
- __mod_node_page_state(pgdat, NR_ISOLATED_ANON + file, -nr_taken);
- spin_unlock_irq(&pgdat->lru_lock);
- mem_cgroup_uncharge_list(&l_hold);
- free_hot_cold_page_list(&l_hold, true);
- }
- static bool inactive_list_is_low(struct lruvec *lruvec, bool file,
- struct scan_control *sc)
- {
- unsigned long inactive_ratio;
- unsigned long inactive, active;
- enum lru_list inactive_lru = file * LRU_FILE;
- enum lru_list active_lru = file * LRU_FILE + LRU_ACTIVE;
- unsigned long gb;
-
- if (!file && !total_swap_pages)
- return false;
- inactive = lruvec_lru_size(lruvec, inactive_lru, sc->reclaim_idx);
- active = lruvec_lru_size(lruvec, active_lru, sc->reclaim_idx);
- gb = (inactive + active) >> (30 - PAGE_SHIFT);
- if (gb)
- inactive_ratio = int_sqrt(10 * gb);
- else
- inactive_ratio = 1;
- return inactive * inactive_ratio < active;
- }
- static unsigned long shrink_list(enum lru_list lru, unsigned long nr_to_scan,
- struct lruvec *lruvec, struct scan_control *sc)
- {
- if (is_active_lru(lru)) {
- if (inactive_list_is_low(lruvec, is_file_lru(lru), sc))
- shrink_active_list(nr_to_scan, lruvec, sc, lru);
- return 0;
- }
- return shrink_inactive_list(nr_to_scan, lruvec, sc, lru);
- }
/* How get_scan_count() splits scanning between the anon and file lists. */
enum scan_balance {
	SCAN_EQUAL,	/* leave every list's scan target unscaled */
	SCAN_FRACT,	/* scale each target by fraction[] / denominator */
	SCAN_ANON,	/* scan the anon lists only; file targets are zeroed */
	SCAN_FILE,	/* scan the file lists only; anon targets are zeroed */
};
- static void get_scan_count(struct lruvec *lruvec, struct mem_cgroup *memcg,
- struct scan_control *sc, unsigned long *nr,
- unsigned long *lru_pages)
- {
- int swappiness = mem_cgroup_swappiness(memcg);
- struct zone_reclaim_stat *reclaim_stat = &lruvec->reclaim_stat;
- u64 fraction[2];
- u64 denominator = 0;
- struct pglist_data *pgdat = lruvec_pgdat(lruvec);
- unsigned long anon_prio, file_prio;
- enum scan_balance scan_balance;
- unsigned long anon, file;
- bool force_scan = false;
- unsigned long ap, fp;
- enum lru_list lru;
- bool some_scanned;
- int pass;
-
- if (current_is_kswapd()) {
- if (!pgdat_reclaimable(pgdat))
- force_scan = true;
- if (!mem_cgroup_online(memcg))
- force_scan = true;
- }
- if (!global_reclaim(sc))
- force_scan = true;
-
- if (!sc->may_swap || mem_cgroup_get_nr_swap_pages(memcg) <= 0) {
- scan_balance = SCAN_FILE;
- goto out;
- }
-
- if (!global_reclaim(sc) && !swappiness) {
- scan_balance = SCAN_FILE;
- goto out;
- }
-
- if (!sc->priority && swappiness) {
- scan_balance = SCAN_EQUAL;
- goto out;
- }
-
- if (global_reclaim(sc)) {
- unsigned long pgdatfile;
- unsigned long pgdatfree;
- int z;
- unsigned long total_high_wmark = 0;
- pgdatfree = sum_zone_node_page_state(pgdat->node_id, NR_FREE_PAGES);
- pgdatfile = node_page_state(pgdat, NR_ACTIVE_FILE) +
- node_page_state(pgdat, NR_INACTIVE_FILE);
- for (z = 0; z < MAX_NR_ZONES; z++) {
- struct zone *zone = &pgdat->node_zones[z];
- if (!managed_zone(zone))
- continue;
- total_high_wmark += high_wmark_pages(zone);
- }
- if (unlikely(pgdatfile + pgdatfree <= total_high_wmark)) {
- scan_balance = SCAN_ANON;
- goto out;
- }
- }
-
- if (!inactive_list_is_low(lruvec, true, sc) &&
- lruvec_lru_size(lruvec, LRU_INACTIVE_FILE, sc->reclaim_idx) >> sc->priority) {
- scan_balance = SCAN_FILE;
- goto out;
- }
- scan_balance = SCAN_FRACT;
-
- anon_prio = swappiness;
- file_prio = 200 - anon_prio;
-
- anon = lruvec_lru_size(lruvec, LRU_ACTIVE_ANON, MAX_NR_ZONES) +
- lruvec_lru_size(lruvec, LRU_INACTIVE_ANON, MAX_NR_ZONES);
- file = lruvec_lru_size(lruvec, LRU_ACTIVE_FILE, MAX_NR_ZONES) +
- lruvec_lru_size(lruvec, LRU_INACTIVE_FILE, MAX_NR_ZONES);
- spin_lock_irq(&pgdat->lru_lock);
- if (unlikely(reclaim_stat->recent_scanned[0] > anon / 4)) {
- reclaim_stat->recent_scanned[0] /= 2;
- reclaim_stat->recent_rotated[0] /= 2;
- }
- if (unlikely(reclaim_stat->recent_scanned[1] > file / 4)) {
- reclaim_stat->recent_scanned[1] /= 2;
- reclaim_stat->recent_rotated[1] /= 2;
- }
-
- ap = anon_prio * (reclaim_stat->recent_scanned[0] + 1);
- ap /= reclaim_stat->recent_rotated[0] + 1;
- fp = file_prio * (reclaim_stat->recent_scanned[1] + 1);
- fp /= reclaim_stat->recent_rotated[1] + 1;
- spin_unlock_irq(&pgdat->lru_lock);
- fraction[0] = ap;
- fraction[1] = fp;
- denominator = ap + fp + 1;
- out:
- some_scanned = false;
-
- for (pass = 0; !some_scanned && pass < 2; pass++) {
- *lru_pages = 0;
- for_each_evictable_lru(lru) {
- int file = is_file_lru(lru);
- unsigned long size;
- unsigned long scan;
- size = lruvec_lru_size(lruvec, lru, sc->reclaim_idx);
- scan = size >> sc->priority;
- if (!scan && pass && force_scan)
- scan = min(size, SWAP_CLUSTER_MAX);
- switch (scan_balance) {
- case SCAN_EQUAL:
-
- break;
- case SCAN_FRACT:
-
- scan = div64_u64(scan * fraction[file],
- denominator);
- break;
- case SCAN_FILE:
- case SCAN_ANON:
-
- if ((scan_balance == SCAN_FILE) != file) {
- size = 0;
- scan = 0;
- }
- break;
- default:
-
- BUG();
- }
- *lru_pages += size;
- nr[lru] = scan;
-
- some_scanned |= !!scan;
- }
- }
- }
- static void shrink_node_memcg(struct pglist_data *pgdat, struct mem_cgroup *memcg,
- struct scan_control *sc, unsigned long *lru_pages)
- {
- struct lruvec *lruvec = mem_cgroup_lruvec(pgdat, memcg);
- unsigned long nr[NR_LRU_LISTS];
- unsigned long targets[NR_LRU_LISTS];
- unsigned long nr_to_scan;
- enum lru_list lru;
- unsigned long nr_reclaimed = 0;
- unsigned long nr_to_reclaim = sc->nr_to_reclaim;
- struct blk_plug plug;
- bool scan_adjusted;
- get_scan_count(lruvec, memcg, sc, nr, lru_pages);
-
- memcpy(targets, nr, sizeof(nr));
-
- scan_adjusted = (global_reclaim(sc) && !current_is_kswapd() &&
- sc->priority == DEF_PRIORITY);
- blk_start_plug(&plug);
- while (nr[LRU_INACTIVE_ANON] || nr[LRU_ACTIVE_FILE] ||
- nr[LRU_INACTIVE_FILE]) {
- unsigned long nr_anon, nr_file, percentage;
- unsigned long nr_scanned;
- for_each_evictable_lru(lru) {
- if (nr[lru]) {
- nr_to_scan = min(nr[lru], SWAP_CLUSTER_MAX);
- nr[lru] -= nr_to_scan;
- nr_reclaimed += shrink_list(lru, nr_to_scan,
- lruvec, sc);
- }
- }
- cond_resched();
- if (nr_reclaimed < nr_to_reclaim || scan_adjusted)
- continue;
-
- nr_file = nr[LRU_INACTIVE_FILE] + nr[LRU_ACTIVE_FILE];
- nr_anon = nr[LRU_INACTIVE_ANON] + nr[LRU_ACTIVE_ANON];
-
- if (!nr_file || !nr_anon)
- break;
- if (nr_file > nr_anon) {
- unsigned long scan_target = targets[LRU_INACTIVE_ANON] +
- targets[LRU_ACTIVE_ANON] + 1;
- lru = LRU_BASE;
- percentage = nr_anon * 100 / scan_target;
- } else {
- unsigned long scan_target = targets[LRU_INACTIVE_FILE] +
- targets[LRU_ACTIVE_FILE] + 1;
- lru = LRU_FILE;
- percentage = nr_file * 100 / scan_target;
- }
-
- nr[lru] = 0;
- nr[lru + LRU_ACTIVE] = 0;
-
- lru = (lru == LRU_FILE) ? LRU_BASE : LRU_FILE;
- nr_scanned = targets[lru] - nr[lru];
- nr[lru] = targets[lru] * (100 - percentage) / 100;
- nr[lru] -= min(nr[lru], nr_scanned);
- lru += LRU_ACTIVE;
- nr_scanned = targets[lru] - nr[lru];
- nr[lru] = targets[lru] * (100 - percentage) / 100;
- nr[lru] -= min(nr[lru], nr_scanned);
- scan_adjusted = true;
- }
- blk_finish_plug(&plug);
- sc->nr_reclaimed += nr_reclaimed;
-
- if (inactive_list_is_low(lruvec, false, sc))
- shrink_active_list(SWAP_CLUSTER_MAX, lruvec,
- sc, LRU_ACTIVE_ANON);
- }
- static bool in_reclaim_compaction(struct scan_control *sc)
- {
- if (IS_ENABLED(CONFIG_COMPACTION) && sc->order &&
- (sc->order > PAGE_ALLOC_COSTLY_ORDER ||
- sc->priority < DEF_PRIORITY - 2))
- return true;
- return false;
- }
- static inline bool should_continue_reclaim(struct pglist_data *pgdat,
- unsigned long nr_reclaimed,
- unsigned long nr_scanned,
- struct scan_control *sc)
- {
- unsigned long pages_for_compaction;
- unsigned long inactive_lru_pages;
- int z;
-
- if (!in_reclaim_compaction(sc))
- return false;
-
- if (sc->gfp_mask & __GFP_REPEAT) {
-
- if (!nr_reclaimed && !nr_scanned)
- return false;
- } else {
-
- if (!nr_reclaimed)
- return false;
- }
-
- pages_for_compaction = compact_gap(sc->order);
- inactive_lru_pages = node_page_state(pgdat, NR_INACTIVE_FILE);
- if (get_nr_swap_pages() > 0)
- inactive_lru_pages += node_page_state(pgdat, NR_INACTIVE_ANON);
- if (sc->nr_reclaimed < pages_for_compaction &&
- inactive_lru_pages > pages_for_compaction)
- return true;
-
- for (z = 0; z <= sc->reclaim_idx; z++) {
- struct zone *zone = &pgdat->node_zones[z];
- if (!managed_zone(zone))
- continue;
- switch (compaction_suitable(zone, sc->order, 0, sc->reclaim_idx)) {
- case COMPACT_SUCCESS:
- case COMPACT_CONTINUE:
- return false;
- default:
-
- ;
- }
- }
- return true;
- }
- static bool shrink_node(pg_data_t *pgdat, struct scan_control *sc)
- {
- struct reclaim_state *reclaim_state = current->reclaim_state;
- unsigned long nr_reclaimed, nr_scanned;
- bool reclaimable = false;
- do {
- struct mem_cgroup *root = sc->target_mem_cgroup;
- struct mem_cgroup_reclaim_cookie reclaim = {
- .pgdat = pgdat,
- .priority = sc->priority,
- };
- unsigned long node_lru_pages = 0;
- struct mem_cgroup *memcg;
- nr_reclaimed = sc->nr_reclaimed;
- nr_scanned = sc->nr_scanned;
- memcg = mem_cgroup_iter(root, NULL, &reclaim);
- do {
- unsigned long lru_pages;
- unsigned long reclaimed;
- unsigned long scanned;
- if (mem_cgroup_low(root, memcg)) {
- if (!sc->may_thrash)
- continue;
- mem_cgroup_events(memcg, MEMCG_LOW, 1);
- }
- reclaimed = sc->nr_reclaimed;
- scanned = sc->nr_scanned;
- shrink_node_memcg(pgdat, memcg, sc, &lru_pages);
- node_lru_pages += lru_pages;
- if (memcg)
- shrink_slab(sc->gfp_mask, pgdat->node_id,
- memcg, sc->nr_scanned - scanned,
- lru_pages);
-
- vmpressure(sc->gfp_mask, memcg, false,
- sc->nr_scanned - scanned,
- sc->nr_reclaimed - reclaimed);
-
- if (!global_reclaim(sc) &&
- sc->nr_reclaimed >= sc->nr_to_reclaim) {
- mem_cgroup_iter_break(root, memcg);
- break;
- }
- } while ((memcg = mem_cgroup_iter(root, memcg, &reclaim)));
-
- if (global_reclaim(sc))
- shrink_slab(sc->gfp_mask, pgdat->node_id, NULL,
- sc->nr_scanned - nr_scanned,
- node_lru_pages);
- if (reclaim_state) {
- sc->nr_reclaimed += reclaim_state->reclaimed_slab;
- reclaim_state->reclaimed_slab = 0;
- }
-
- vmpressure(sc->gfp_mask, sc->target_mem_cgroup, true,
- sc->nr_scanned - nr_scanned,
- sc->nr_reclaimed - nr_reclaimed);
- if (sc->nr_reclaimed - nr_reclaimed)
- reclaimable = true;
- } while (should_continue_reclaim(pgdat, sc->nr_reclaimed - nr_reclaimed,
- sc->nr_scanned - nr_scanned, sc));
- return reclaimable;
- }
- static inline bool compaction_ready(struct zone *zone, struct scan_control *sc)
- {
- unsigned long watermark;
- enum compact_result suitable;
- suitable = compaction_suitable(zone, sc->order, 0, sc->reclaim_idx);
- if (suitable == COMPACT_SUCCESS)
-
- return true;
- if (suitable == COMPACT_SKIPPED)
-
- return false;
-
- watermark = high_wmark_pages(zone) + compact_gap(sc->order);
- return zone_watermark_ok_safe(zone, 0, watermark, sc->reclaim_idx);
- }
- static void shrink_zones(struct zonelist *zonelist, struct scan_control *sc)
- {
- struct zoneref *z;
- struct zone *zone;
- unsigned long nr_soft_reclaimed;
- unsigned long nr_soft_scanned;
- gfp_t orig_mask;
- pg_data_t *last_pgdat = NULL;
-
- orig_mask = sc->gfp_mask;
- if (buffer_heads_over_limit) {
- sc->gfp_mask |= __GFP_HIGHMEM;
- sc->reclaim_idx = gfp_zone(sc->gfp_mask);
- }
- for_each_zone_zonelist_nodemask(zone, z, zonelist,
- sc->reclaim_idx, sc->nodemask) {
-
- if (global_reclaim(sc)) {
- if (!cpuset_zone_allowed(zone,
- GFP_KERNEL | __GFP_HARDWALL))
- continue;
- if (sc->priority != DEF_PRIORITY &&
- !pgdat_reclaimable(zone->zone_pgdat))
- continue;
-
- if (IS_ENABLED(CONFIG_COMPACTION) &&
- sc->order > PAGE_ALLOC_COSTLY_ORDER &&
- compaction_ready(zone, sc)) {
- sc->compaction_ready = true;
- continue;
- }
-
- if (zone->zone_pgdat == last_pgdat)
- continue;
-
- nr_soft_scanned = 0;
- nr_soft_reclaimed = mem_cgroup_soft_limit_reclaim(zone->zone_pgdat,
- sc->order, sc->gfp_mask,
- &nr_soft_scanned);
- sc->nr_reclaimed += nr_soft_reclaimed;
- sc->nr_scanned += nr_soft_scanned;
-
- }
-
- if (zone->zone_pgdat == last_pgdat)
- continue;
- last_pgdat = zone->zone_pgdat;
- shrink_node(zone->zone_pgdat, sc);
- }
-
- sc->gfp_mask = orig_mask;
- }
- static unsigned long do_try_to_free_pages(struct zonelist *zonelist,
- struct scan_control *sc)
- {
- int initial_priority = sc->priority;
- unsigned long total_scanned = 0;
- unsigned long writeback_threshold;
- retry:
- delayacct_freepages_start();
- if (global_reclaim(sc))
- __count_zid_vm_events(ALLOCSTALL, sc->reclaim_idx, 1);
- do {
- vmpressure_prio(sc->gfp_mask, sc->target_mem_cgroup,
- sc->priority);
- sc->nr_scanned = 0;
- shrink_zones(zonelist, sc);
- total_scanned += sc->nr_scanned;
- if (sc->nr_reclaimed >= sc->nr_to_reclaim)
- break;
- if (sc->compaction_ready)
- break;
-
- if (sc->priority < DEF_PRIORITY - 2)
- sc->may_writepage = 1;
-
- writeback_threshold = sc->nr_to_reclaim + sc->nr_to_reclaim / 2;
- if (total_scanned > writeback_threshold) {
- wakeup_flusher_threads(laptop_mode ? 0 : total_scanned,
- WB_REASON_TRY_TO_FREE_PAGES);
- sc->may_writepage = 1;
- }
- } while (--sc->priority >= 0);
- delayacct_freepages_end();
- if (sc->nr_reclaimed)
- return sc->nr_reclaimed;
-
- if (sc->compaction_ready)
- return 1;
-
- if (!sc->may_thrash) {
- sc->priority = initial_priority;
- sc->may_thrash = 1;
- goto retry;
- }
- return 0;
- }
- static bool pfmemalloc_watermark_ok(pg_data_t *pgdat)
- {
- struct zone *zone;
- unsigned long pfmemalloc_reserve = 0;
- unsigned long free_pages = 0;
- int i;
- bool wmark_ok;
- for (i = 0; i <= ZONE_NORMAL; i++) {
- zone = &pgdat->node_zones[i];
- if (!managed_zone(zone) ||
- pgdat_reclaimable_pages(pgdat) == 0)
- continue;
- pfmemalloc_reserve += min_wmark_pages(zone);
- free_pages += zone_page_state(zone, NR_FREE_PAGES);
- }
-
- if (!pfmemalloc_reserve)
- return true;
- wmark_ok = free_pages > pfmemalloc_reserve / 2;
-
- if (!wmark_ok && waitqueue_active(&pgdat->kswapd_wait)) {
- pgdat->kswapd_classzone_idx = min(pgdat->kswapd_classzone_idx,
- (enum zone_type)ZONE_NORMAL);
- wake_up_interruptible(&pgdat->kswapd_wait);
- }
- return wmark_ok;
- }
- static bool throttle_direct_reclaim(gfp_t gfp_mask, struct zonelist *zonelist,
- nodemask_t *nodemask)
- {
- struct zoneref *z;
- struct zone *zone;
- pg_data_t *pgdat = NULL;
-
- if (current->flags & PF_KTHREAD)
- goto out;
-
- if (fatal_signal_pending(current))
- goto out;
-
- for_each_zone_zonelist_nodemask(zone, z, zonelist,
- gfp_zone(gfp_mask), nodemask) {
- if (zone_idx(zone) > ZONE_NORMAL)
- continue;
-
- pgdat = zone->zone_pgdat;
- if (pfmemalloc_watermark_ok(pgdat))
- goto out;
- break;
- }
-
- if (!pgdat)
- goto out;
-
- count_vm_event(PGSCAN_DIRECT_THROTTLE);
-
- if (!(gfp_mask & __GFP_FS)) {
- wait_event_interruptible_timeout(pgdat->pfmemalloc_wait,
- pfmemalloc_watermark_ok(pgdat), HZ);
- goto check_pending;
- }
-
- wait_event_killable(zone->zone_pgdat->pfmemalloc_wait,
- pfmemalloc_watermark_ok(pgdat));
- check_pending:
- if (fatal_signal_pending(current))
- return true;
- out:
- return false;
- }
- unsigned long try_to_free_pages(struct zonelist *zonelist, int order,
- gfp_t gfp_mask, nodemask_t *nodemask)
- {
- unsigned long nr_reclaimed;
- struct scan_control sc = {
- .nr_to_reclaim = SWAP_CLUSTER_MAX,
- .gfp_mask = (gfp_mask = memalloc_noio_flags(gfp_mask)),
- .reclaim_idx = gfp_zone(gfp_mask),
- .order = order,
- .nodemask = nodemask,
- .priority = DEF_PRIORITY,
- .may_writepage = !laptop_mode,
- .may_unmap = 1,
- .may_swap = 1,
- };
-
- if (throttle_direct_reclaim(gfp_mask, zonelist, nodemask))
- return 1;
- trace_mm_vmscan_direct_reclaim_begin(order,
- sc.may_writepage,
- gfp_mask,
- sc.reclaim_idx);
- nr_reclaimed = do_try_to_free_pages(zonelist, &sc);
- trace_mm_vmscan_direct_reclaim_end(nr_reclaimed);
- return nr_reclaimed;
- }
- #ifdef CONFIG_MEMCG
- unsigned long mem_cgroup_shrink_node(struct mem_cgroup *memcg,
- gfp_t gfp_mask, bool noswap,
- pg_data_t *pgdat,
- unsigned long *nr_scanned)
- {
- struct scan_control sc = {
- .nr_to_reclaim = SWAP_CLUSTER_MAX,
- .target_mem_cgroup = memcg,
- .may_writepage = !laptop_mode,
- .may_unmap = 1,
- .reclaim_idx = MAX_NR_ZONES - 1,
- .may_swap = !noswap,
- };
- unsigned long lru_pages;
- sc.gfp_mask = (gfp_mask & GFP_RECLAIM_MASK) |
- (GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK);
- trace_mm_vmscan_memcg_softlimit_reclaim_begin(sc.order,
- sc.may_writepage,
- sc.gfp_mask,
- sc.reclaim_idx);
-
- shrink_node_memcg(pgdat, memcg, &sc, &lru_pages);
- trace_mm_vmscan_memcg_softlimit_reclaim_end(sc.nr_reclaimed);
- *nr_scanned = sc.nr_scanned;
- return sc.nr_reclaimed;
- }
- unsigned long try_to_free_mem_cgroup_pages(struct mem_cgroup *memcg,
- unsigned long nr_pages,
- gfp_t gfp_mask,
- bool may_swap)
- {
- struct zonelist *zonelist;
- unsigned long nr_reclaimed;
- int nid;
- struct scan_control sc = {
- .nr_to_reclaim = max(nr_pages, SWAP_CLUSTER_MAX),
- .gfp_mask = (gfp_mask & GFP_RECLAIM_MASK) |
- (GFP_HIGHUSER_MOVABLE & ~GFP_RECLAIM_MASK),
- .reclaim_idx = MAX_NR_ZONES - 1,
- .target_mem_cgroup = memcg,
- .priority = DEF_PRIORITY,
- .may_writepage = !laptop_mode,
- .may_unmap = 1,
- .may_swap = may_swap,
- };
-
- nid = mem_cgroup_select_victim_node(memcg);
- zonelist = &NODE_DATA(nid)->node_zonelists[ZONELIST_FALLBACK];
- trace_mm_vmscan_memcg_reclaim_begin(0,
- sc.may_writepage,
- sc.gfp_mask,
- sc.reclaim_idx);
- current->flags |= PF_MEMALLOC;
- nr_reclaimed = do_try_to_free_pages(zonelist, &sc);
- current->flags &= ~PF_MEMALLOC;
- trace_mm_vmscan_memcg_reclaim_end(nr_reclaimed);
- return nr_reclaimed;
- }
- #endif
- static void age_active_anon(struct pglist_data *pgdat,
- struct scan_control *sc)
- {
- struct mem_cgroup *memcg;
- if (!total_swap_pages)
- return;
- memcg = mem_cgroup_iter(NULL, NULL, NULL);
- do {
- struct lruvec *lruvec = mem_cgroup_lruvec(pgdat, memcg);
- if (inactive_list_is_low(lruvec, false, sc))
- shrink_active_list(SWAP_CLUSTER_MAX, lruvec,
- sc, LRU_ACTIVE_ANON);
- memcg = mem_cgroup_iter(NULL, memcg, NULL);
- } while (memcg);
- }
- static bool zone_balanced(struct zone *zone, int order, int classzone_idx)
- {
- unsigned long mark = high_wmark_pages(zone);
- if (!zone_watermark_ok_safe(zone, order, mark, classzone_idx))
- return false;
-
- clear_bit(PGDAT_CONGESTED, &zone->zone_pgdat->flags);
- clear_bit(PGDAT_DIRTY, &zone->zone_pgdat->flags);
- return true;
- }
- static bool prepare_kswapd_sleep(pg_data_t *pgdat, int order, int classzone_idx)
- {
- int i;
-
- if (waitqueue_active(&pgdat->pfmemalloc_wait))
- wake_up_all(&pgdat->pfmemalloc_wait);
- for (i = 0; i <= classzone_idx; i++) {
- struct zone *zone = pgdat->node_zones + i;
- if (!managed_zone(zone))
- continue;
- if (!zone_balanced(zone, order, classzone_idx))
- return false;
- }
- return true;
- }
- static bool kswapd_shrink_node(pg_data_t *pgdat,
- struct scan_control *sc)
- {
- struct zone *zone;
- int z;
-
- sc->nr_to_reclaim = 0;
- for (z = 0; z <= sc->reclaim_idx; z++) {
- zone = pgdat->node_zones + z;
- if (!managed_zone(zone))
- continue;
- sc->nr_to_reclaim += max(high_wmark_pages(zone), SWAP_CLUSTER_MAX);
- }
-
- shrink_node(pgdat, sc);
-
- if (sc->order && sc->nr_reclaimed >= compact_gap(sc->order))
- sc->order = 0;
- return sc->nr_scanned >= sc->nr_to_reclaim;
- }
- static int balance_pgdat(pg_data_t *pgdat, int order, int classzone_idx)
- {
- int i;
- unsigned long nr_soft_reclaimed;
- unsigned long nr_soft_scanned;
- struct zone *zone;
- struct scan_control sc = {
- .gfp_mask = GFP_KERNEL,
- .order = order,
- .priority = DEF_PRIORITY,
- .may_writepage = !laptop_mode,
- .may_unmap = 1,
- .may_swap = 1,
- };
- count_vm_event(PAGEOUTRUN);
- do {
- bool raise_priority = true;
- sc.nr_reclaimed = 0;
- sc.reclaim_idx = classzone_idx;
-
- if (buffer_heads_over_limit) {
- for (i = MAX_NR_ZONES - 1; i >= 0; i--) {
- zone = pgdat->node_zones + i;
- if (!managed_zone(zone))
- continue;
- sc.reclaim_idx = i;
- break;
- }
- }
-
- for (i = classzone_idx; i >= 0; i--) {
- zone = pgdat->node_zones + i;
- if (!managed_zone(zone))
- continue;
- if (zone_balanced(zone, sc.order, classzone_idx))
- goto out;
- }
-
- age_active_anon(pgdat, &sc);
-
- if (sc.priority < DEF_PRIORITY - 2 || !pgdat_reclaimable(pgdat))
- sc.may_writepage = 1;
-
- sc.nr_scanned = 0;
- nr_soft_scanned = 0;
- nr_soft_reclaimed = mem_cgroup_soft_limit_reclaim(pgdat, sc.order,
- sc.gfp_mask, &nr_soft_scanned);
- sc.nr_reclaimed += nr_soft_reclaimed;
-
- if (kswapd_shrink_node(pgdat, &sc))
- raise_priority = false;
-
- if (waitqueue_active(&pgdat->pfmemalloc_wait) &&
- pfmemalloc_watermark_ok(pgdat))
- wake_up_all(&pgdat->pfmemalloc_wait);
-
- if (try_to_freeze() || kthread_should_stop())
- break;
-
- if (raise_priority || !sc.nr_reclaimed)
- sc.priority--;
- } while (sc.priority >= 1);
- out:
-
- return sc.order;
- }
- static void kswapd_try_to_sleep(pg_data_t *pgdat, int alloc_order, int reclaim_order,
- unsigned int classzone_idx)
- {
- long remaining = 0;
- DEFINE_WAIT(wait);
- if (freezing(current) || kthread_should_stop())
- return;
- prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
-
- if (prepare_kswapd_sleep(pgdat, reclaim_order, classzone_idx)) {
-
- reset_isolation_suitable(pgdat);
-
- wakeup_kcompactd(pgdat, alloc_order, classzone_idx);
- remaining = schedule_timeout(HZ/10);
-
- if (remaining) {
- pgdat->kswapd_classzone_idx = max(pgdat->kswapd_classzone_idx, classzone_idx);
- pgdat->kswapd_order = max(pgdat->kswapd_order, reclaim_order);
- }
- finish_wait(&pgdat->kswapd_wait, &wait);
- prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
- }
-
- if (!remaining &&
- prepare_kswapd_sleep(pgdat, reclaim_order, classzone_idx)) {
- trace_mm_vmscan_kswapd_sleep(pgdat->node_id);
-
- set_pgdat_percpu_threshold(pgdat, calculate_normal_threshold);
- if (!kthread_should_stop())
- schedule();
- set_pgdat_percpu_threshold(pgdat, calculate_pressure_threshold);
- } else {
- if (remaining)
- count_vm_event(KSWAPD_LOW_WMARK_HIT_QUICKLY);
- else
- count_vm_event(KSWAPD_HIGH_WMARK_HIT_QUICKLY);
- }
- finish_wait(&pgdat->kswapd_wait, &wait);
- }
- static int kswapd(void *p)
- {
- unsigned int alloc_order, reclaim_order, classzone_idx;
- pg_data_t *pgdat = (pg_data_t*)p;
- struct task_struct *tsk = current;
- struct reclaim_state reclaim_state = {
- .reclaimed_slab = 0,
- };
- const struct cpumask *cpumask = cpumask_of_node(pgdat->node_id);
- lockdep_set_current_reclaim_state(GFP_KERNEL);
- if (!cpumask_empty(cpumask))
- set_cpus_allowed_ptr(tsk, cpumask);
- current->reclaim_state = &reclaim_state;
-
- tsk->flags |= PF_MEMALLOC | PF_SWAPWRITE | PF_KSWAPD;
- set_freezable();
- pgdat->kswapd_order = alloc_order = reclaim_order = 0;
- pgdat->kswapd_classzone_idx = classzone_idx = 0;
- for ( ; ; ) {
- bool ret;
- kswapd_try_sleep:
- kswapd_try_to_sleep(pgdat, alloc_order, reclaim_order,
- classzone_idx);
-
- alloc_order = reclaim_order = pgdat->kswapd_order;
- classzone_idx = pgdat->kswapd_classzone_idx;
- pgdat->kswapd_order = 0;
- pgdat->kswapd_classzone_idx = 0;
- ret = try_to_freeze();
- if (kthread_should_stop())
- break;
-
- if (ret)
- continue;
-
- trace_mm_vmscan_kswapd_wake(pgdat->node_id, classzone_idx,
- alloc_order);
- reclaim_order = balance_pgdat(pgdat, alloc_order, classzone_idx);
- if (reclaim_order < alloc_order)
- goto kswapd_try_sleep;
- alloc_order = reclaim_order = pgdat->kswapd_order;
- classzone_idx = pgdat->kswapd_classzone_idx;
- }
- tsk->flags &= ~(PF_MEMALLOC | PF_SWAPWRITE | PF_KSWAPD);
- current->reclaim_state = NULL;
- lockdep_clear_current_reclaim_state();
- return 0;
- }
- void wakeup_kswapd(struct zone *zone, int order, enum zone_type classzone_idx)
- {
- pg_data_t *pgdat;
- int z;
- if (!managed_zone(zone))
- return;
- if (!cpuset_zone_allowed(zone, GFP_KERNEL | __GFP_HARDWALL))
- return;
- pgdat = zone->zone_pgdat;
- pgdat->kswapd_classzone_idx = max(pgdat->kswapd_classzone_idx, classzone_idx);
- pgdat->kswapd_order = max(pgdat->kswapd_order, order);
- if (!waitqueue_active(&pgdat->kswapd_wait))
- return;
-
- for (z = 0; z <= classzone_idx; z++) {
- zone = pgdat->node_zones + z;
- if (!managed_zone(zone))
- continue;
- if (zone_balanced(zone, order, classzone_idx))
- return;
- }
- trace_mm_vmscan_wakeup_kswapd(pgdat->node_id, zone_idx(zone), order);
- wake_up_interruptible(&pgdat->kswapd_wait);
- }
- #ifdef CONFIG_HIBERNATION
- unsigned long shrink_all_memory(unsigned long nr_to_reclaim)
- {
- struct reclaim_state reclaim_state;
- struct scan_control sc = {
- .nr_to_reclaim = nr_to_reclaim,
- .gfp_mask = GFP_HIGHUSER_MOVABLE,
- .reclaim_idx = MAX_NR_ZONES - 1,
- .priority = DEF_PRIORITY,
- .may_writepage = 1,
- .may_unmap = 1,
- .may_swap = 1,
- .hibernation_mode = 1,
- };
- struct zonelist *zonelist = node_zonelist(numa_node_id(), sc.gfp_mask);
- struct task_struct *p = current;
- unsigned long nr_reclaimed;
- p->flags |= PF_MEMALLOC;
- lockdep_set_current_reclaim_state(sc.gfp_mask);
- reclaim_state.reclaimed_slab = 0;
- p->reclaim_state = &reclaim_state;
- nr_reclaimed = do_try_to_free_pages(zonelist, &sc);
- p->reclaim_state = NULL;
- lockdep_clear_current_reclaim_state();
- p->flags &= ~PF_MEMALLOC;
- return nr_reclaimed;
- }
- #endif
- static int cpu_callback(struct notifier_block *nfb, unsigned long action,
- void *hcpu)
- {
- int nid;
- if (action == CPU_ONLINE || action == CPU_ONLINE_FROZEN) {
- for_each_node_state(nid, N_MEMORY) {
- pg_data_t *pgdat = NODE_DATA(nid);
- const struct cpumask *mask;
- mask = cpumask_of_node(pgdat->node_id);
- if (cpumask_any_and(cpu_online_mask, mask) < nr_cpu_ids)
-
- set_cpus_allowed_ptr(pgdat->kswapd, mask);
- }
- }
- return NOTIFY_OK;
- }
- int kswapd_run(int nid)
- {
- pg_data_t *pgdat = NODE_DATA(nid);
- int ret = 0;
- if (pgdat->kswapd)
- return 0;
- pgdat->kswapd = kthread_run(kswapd, pgdat, "kswapd%d", nid);
- if (IS_ERR(pgdat->kswapd)) {
-
- BUG_ON(system_state == SYSTEM_BOOTING);
- pr_err("Failed to start kswapd on node %d\n", nid);
- ret = PTR_ERR(pgdat->kswapd);
- pgdat->kswapd = NULL;
- }
- return ret;
- }
- void kswapd_stop(int nid)
- {
- struct task_struct *kswapd = NODE_DATA(nid)->kswapd;
- if (kswapd) {
- kthread_stop(kswapd);
- NODE_DATA(nid)->kswapd = NULL;
- }
- }
- static int __init kswapd_init(void)
- {
- int nid;
- swap_setup();
- for_each_node_state(nid, N_MEMORY)
- kswapd_run(nid);
- hotcpu_notifier(cpu_callback, 0);
- return 0;
- }
- module_init(kswapd_init)
- #ifdef CONFIG_NUMA
- int node_reclaim_mode __read_mostly;
- #define RECLAIM_OFF 0
- #define RECLAIM_ZONE (1<<0)
- #define RECLAIM_WRITE (1<<1)
- #define RECLAIM_UNMAP (1<<2)
- #define NODE_RECLAIM_PRIORITY 4
- int sysctl_min_unmapped_ratio = 1;
- int sysctl_min_slab_ratio = 5;
- static inline unsigned long node_unmapped_file_pages(struct pglist_data *pgdat)
- {
- unsigned long file_mapped = node_page_state(pgdat, NR_FILE_MAPPED);
- unsigned long file_lru = node_page_state(pgdat, NR_INACTIVE_FILE) +
- node_page_state(pgdat, NR_ACTIVE_FILE);
-
- return (file_lru > file_mapped) ? (file_lru - file_mapped) : 0;
- }
- static unsigned long node_pagecache_reclaimable(struct pglist_data *pgdat)
- {
- unsigned long nr_pagecache_reclaimable;
- unsigned long delta = 0;
-
- if (node_reclaim_mode & RECLAIM_UNMAP)
- nr_pagecache_reclaimable = node_page_state(pgdat, NR_FILE_PAGES);
- else
- nr_pagecache_reclaimable = node_unmapped_file_pages(pgdat);
-
- if (!(node_reclaim_mode & RECLAIM_WRITE))
- delta += node_page_state(pgdat, NR_FILE_DIRTY);
-
- if (unlikely(delta > nr_pagecache_reclaimable))
- delta = nr_pagecache_reclaimable;
- return nr_pagecache_reclaimable - delta;
- }
- static int __node_reclaim(struct pglist_data *pgdat, gfp_t gfp_mask, unsigned int order)
- {
-
- const unsigned long nr_pages = 1 << order;
- struct task_struct *p = current;
- struct reclaim_state reclaim_state;
- int classzone_idx = gfp_zone(gfp_mask);
- struct scan_control sc = {
- .nr_to_reclaim = max(nr_pages, SWAP_CLUSTER_MAX),
- .gfp_mask = (gfp_mask = memalloc_noio_flags(gfp_mask)),
- .order = order,
- .priority = NODE_RECLAIM_PRIORITY,
- .may_writepage = !!(node_reclaim_mode & RECLAIM_WRITE),
- .may_unmap = !!(node_reclaim_mode & RECLAIM_UNMAP),
- .may_swap = 1,
- .reclaim_idx = classzone_idx,
- };
- cond_resched();
-
- p->flags |= PF_MEMALLOC | PF_SWAPWRITE;
- lockdep_set_current_reclaim_state(gfp_mask);
- reclaim_state.reclaimed_slab = 0;
- p->reclaim_state = &reclaim_state;
- if (node_pagecache_reclaimable(pgdat) > pgdat->min_unmapped_pages) {
-
- do {
- shrink_node(pgdat, &sc);
- } while (sc.nr_reclaimed < nr_pages && --sc.priority >= 0);
- }
- p->reclaim_state = NULL;
- current->flags &= ~(PF_MEMALLOC | PF_SWAPWRITE);
- lockdep_clear_current_reclaim_state();
- return sc.nr_reclaimed >= nr_pages;
- }
- int node_reclaim(struct pglist_data *pgdat, gfp_t gfp_mask, unsigned int order)
- {
- int ret;
-
- if (node_pagecache_reclaimable(pgdat) <= pgdat->min_unmapped_pages &&
- sum_zone_node_page_state(pgdat->node_id, NR_SLAB_RECLAIMABLE) <= pgdat->min_slab_pages)
- return NODE_RECLAIM_FULL;
- if (!pgdat_reclaimable(pgdat))
- return NODE_RECLAIM_FULL;
-
- if (!gfpflags_allow_blocking(gfp_mask) || (current->flags & PF_MEMALLOC))
- return NODE_RECLAIM_NOSCAN;
-
- if (node_state(pgdat->node_id, N_CPU) && pgdat->node_id != numa_node_id())
- return NODE_RECLAIM_NOSCAN;
- if (test_and_set_bit(PGDAT_RECLAIM_LOCKED, &pgdat->flags))
- return NODE_RECLAIM_NOSCAN;
- ret = __node_reclaim(pgdat, gfp_mask, order);
- clear_bit(PGDAT_RECLAIM_LOCKED, &pgdat->flags);
- if (!ret)
- count_vm_event(PGSCAN_ZONE_RECLAIM_FAILED);
- return ret;
- }
- #endif
/*
 * Test whether @page may be placed on an evictable LRU list.
 *
 * Returns 0 if the page's mapping is marked unevictable or the page is
 * mlocked, and 1 otherwise.
 */
int page_evictable(struct page *page)
{
	if (mapping_unevictable(page_mapping(page)))
		return 0;

	return !PageMlocked(page);
}
- #ifdef CONFIG_SHMEM
- void check_move_unevictable_pages(struct page **pages, int nr_pages)
- {
- struct lruvec *lruvec;
- struct pglist_data *pgdat = NULL;
- int pgscanned = 0;
- int pgrescued = 0;
- int i;
- for (i = 0; i < nr_pages; i++) {
- struct page *page = pages[i];
- struct pglist_data *pagepgdat = page_pgdat(page);
- pgscanned++;
- if (pagepgdat != pgdat) {
- if (pgdat)
- spin_unlock_irq(&pgdat->lru_lock);
- pgdat = pagepgdat;
- spin_lock_irq(&pgdat->lru_lock);
- }
- lruvec = mem_cgroup_page_lruvec(page, pgdat);
- if (!PageLRU(page) || !PageUnevictable(page))
- continue;
- if (page_evictable(page)) {
- enum lru_list lru = page_lru_base_type(page);
- VM_BUG_ON_PAGE(PageActive(page), page);
- ClearPageUnevictable(page);
- del_page_from_lru_list(page, lruvec, LRU_UNEVICTABLE);
- add_page_to_lru_list(page, lruvec, lru);
- pgrescued++;
- }
- }
- if (pgdat) {
- __count_vm_events(UNEVICTABLE_PGRESCUED, pgrescued);
- __count_vm_events(UNEVICTABLE_PGSCANNED, pgscanned);
- spin_unlock_irq(&pgdat->lru_lock);
- }
- }
- #endif
|