mirror of
https://git.kernel.org/pub/scm/linux/kernel/git/stable/linux.git
synced 2026-05-20 14:35:06 +02:00
6ebf98d71f
CONFIG_MEMORY_HOTREMOVE, CONFIG_COMPACTION and CONFIG_CMA all select CONFIG_MIGRATION, because they require it to work (users). Only CONFIG_NUMA_BALANCING and CONFIG_BALLOON_MIGRATION depend on CONFIG_MIGRATION. CONFIG_BALLOON_MIGRATION is not an actual user, but an implementation of migration support, so the dependency is correct (CONFIG_BALLOON_MIGRATION does not make any sense without CONFIG_MIGRATION). However, kconfig-language.rst clearly states "In general use select only for non-visible symbols". So far, CONFIG_MIGRATION is user-visible ... and the dependencies are rather confusing. The whole reason why CONFIG_MIGRATION is user-visible is because of CONFIG_NUMA: some users might want CONFIG_NUMA but not page migration support. Let's clean all that up by introducing a dedicated CONFIG_NUMA_MIGRATION config option for that purpose only. Make CONFIG_NUMA_BALANCING, which so far depended on CONFIG_NUMA && CONFIG_MIGRATION, depend on CONFIG_NUMA_MIGRATION instead. CONFIG_NUMA_MIGRATION will depend on CONFIG_NUMA && CONFIG_MMU. CONFIG_NUMA_MIGRATION is user-visible and will default to "y". We use that default so new configs will automatically enable it, just like it was the case with CONFIG_MIGRATION. The downside is that some configs that used to have CONFIG_MIGRATION=n might get it re-enabled by CONFIG_NUMA_MIGRATION=y, which shouldn't be a problem. CONFIG_MIGRATION is now a non-visible config option. Any code that selects CONFIG_MIGRATION (as before) must depend directly or indirectly on CONFIG_MMU. CONFIG_NUMA_MIGRATION is responsible for any NUMA migration code, which is mempolicy migration code, memory-tiering code, and move_pages() code in migrate.c. CONFIG_NUMA_BALANCING uses its functionality. Note that this implies that with CONFIG_NUMA_MIGRATION=n, move_pages() will not be available even though CONFIG_MIGRATION=y, which is an expected change. In migrate.c, we can remove the CONFIG_NUMA check as both CONFIG_NUMA_MIGRATION and CONFIG_NUMA_BALANCING depend on it.
With this change, CONFIG_MIGRATION is an internal config, all users of migration selects CONFIG_MIGRATION, and only CONFIG_BALLOON_MIGRATION depends on it. Link: https://lkml.kernel.org/r/20260319-config_migration-v1-2-42270124966f@kernel.org Signed-off-by: David Hildenbrand (Arm) <david@kernel.org> Reviewed-by: Lorenzo Stoakes (Oracle) <ljs@kernel.org> Acked-by: Zi Yan <ziy@nvidia.com> Reviewed-by: Jonathan Cameron <jonathan.cameron@huawei.com> Cc: Albert Ou <aou@eecs.berkeley.edu> Cc: Alexander Gordeev <agordeev@linux.ibm.com> Cc: Alexandre Ghiti <alex@ghiti.fr> Cc: Alistair Popple <apopple@nvidia.com> Cc: "Borislav Petkov (AMD)" <bp@alien8.de> Cc: Byungchul Park <byungchul@sk.com> Cc: Catalin Marinas <catalin.marinas@arm.com> Cc: Christian Borntraeger <borntraeger@linux.ibm.com> Cc: Gregory Price <gourry@gourry.net> Cc: Heiko Carstens <hca@linux.ibm.com> Cc: "H. Peter Anvin" <hpa@zytor.com> Cc: Huacai Chen <chenhuacai@kernel.org> Cc: "Huang, Ying" <ying.huang@linux.alibaba.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Joshua Hahn <joshua.hahnjy@gmail.com> Cc: Liam Howlett <liam.howlett@oracle.com> Cc: Madhavan Srinivasan <maddy@linux.ibm.com> Cc: Matthew Brost <matthew.brost@intel.com> Cc: Michael Ellerman <mpe@ellerman.id.au> Cc: Michal Hocko <mhocko@suse.com> Cc: Mike Rapoport <rppt@kernel.org> Cc: Nicholas Piggin <npiggin@gmail.com> Cc: Palmer Dabbelt <palmer@dabbelt.com> Cc: Rakie Kim <rakie.kim@sk.com> Cc: Sebastian Andrzej Siewior <bigeasy@linutronix.de> Cc: Steven Rostedt <rostedt@goodmis.org> Cc: Suren Baghdasaryan <surenb@google.com> Cc: Sven Schnelle <svens@linux.ibm.com> Cc: Vasily Gorbik <gor@linux.ibm.com> Cc: WANG Xuerui <kernel@xen0n.name> Cc: Will Deacon <will@kernel.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
156 lines
4.0 KiB
C
156 lines
4.0 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#ifndef _LINUX_MEMORY_TIERS_H
|
|
#define _LINUX_MEMORY_TIERS_H
|
|
|
|
#include <linux/types.h>
|
|
#include <linux/nodemask.h>
|
|
#include <linux/kref.h>
|
|
#include <linux/mmzone.h>
|
|
#include <linux/notifier.h>
|
|
/*
 * Each memory tier covers a chunk of abstract distance values that is
 * MEMTIER_CHUNK_SIZE (1 << MEMTIER_CHUNK_BITS == 128) wide.
 */
#define MEMTIER_CHUNK_BITS	7
#define MEMTIER_CHUNK_SIZE	(1 << MEMTIER_CHUNK_BITS)

/*
 * Smaller abstract distance values imply faster (higher) memory tiers. Offset
 * the DRAM adistance so that we can accommodate devices with a slightly lower
 * adistance value (slightly faster) than default DRAM adistance to be part of
 * the same memory tier.
 *
 * The value is four full chunks plus half a chunk: 4 * 128 + 64 == 576.
 */
#define MEMTIER_ADISTANCE_DRAM	((4L * MEMTIER_CHUNK_SIZE) + (MEMTIER_CHUNK_SIZE >> 1))
|
|
|
|
struct memory_tier;
|
|
struct memory_dev_type {
|
|
/* list of memory types that are part of same tier as this type */
|
|
struct list_head tier_sibling;
|
|
/* list of memory types that are managed by one driver */
|
|
struct list_head list;
|
|
/* abstract distance for this specific memory type */
|
|
int adistance;
|
|
/* Nodes of same abstract distance */
|
|
nodemask_t nodes;
|
|
struct kref kref;
|
|
};
|
|
|
|
/* Forward declaration: this header only passes struct access_coordinate by pointer. */
struct access_coordinate;
|
|
|
|
#ifdef CONFIG_NUMA
|
|
extern bool numa_demotion_enabled;
|
|
extern struct memory_dev_type *default_dram_type;
|
|
extern nodemask_t default_dram_nodes;
|
|
struct memory_dev_type *alloc_memory_type(int adistance);
|
|
void put_memory_type(struct memory_dev_type *memtype);
|
|
void init_node_memory_type(int node, struct memory_dev_type *default_type);
|
|
void clear_node_memory_type(int node, struct memory_dev_type *memtype);
|
|
int register_mt_adistance_algorithm(struct notifier_block *nb);
|
|
int unregister_mt_adistance_algorithm(struct notifier_block *nb);
|
|
int mt_calc_adistance(int node, int *adist);
|
|
int mt_set_default_dram_perf(int nid, struct access_coordinate *perf,
|
|
const char *source);
|
|
int mt_perf_to_adistance(struct access_coordinate *perf, int *adist);
|
|
struct memory_dev_type *mt_find_alloc_memory_type(int adist,
|
|
struct list_head *memory_types);
|
|
void mt_put_memory_types(struct list_head *memory_types);
|
|
#ifdef CONFIG_NUMA_MIGRATION
|
|
int next_demotion_node(int node, const nodemask_t *allowed_mask);
|
|
void node_get_allowed_targets(pg_data_t *pgdat, nodemask_t *targets);
|
|
bool node_is_toptier(int node);
|
|
#else
|
|
static inline int next_demotion_node(int node, const nodemask_t *allowed_mask)
|
|
{
|
|
return NUMA_NO_NODE;
|
|
}
|
|
|
|
/*
 * CONFIG_NUMA=y, CONFIG_NUMA_MIGRATION=n fallback: stores NODE_MASK_NONE in
 * *@targets; @pgdat is not consulted. @targets must be a valid pointer.
 */
static inline void node_get_allowed_targets(pg_data_t *pgdat, nodemask_t *targets)
{
	*targets = NODE_MASK_NONE;
}
|
|
|
|
/*
 * CONFIG_NUMA=y, CONFIG_NUMA_MIGRATION=n fallback: reports every node as
 * top tier, regardless of @node.
 */
static inline bool node_is_toptier(int node)
{
	return true;
}
|
|
#endif
|
|
|
|
#else
|
|
|
|
/*
 * !CONFIG_NUMA: the CONFIG_NUMA variables of the same names are replaced by
 * constant macros, so code that only reads them still compiles.
 */
#define numa_demotion_enabled	false
#define default_dram_type	NULL
#define default_dram_nodes	NODE_MASK_NONE
|
|
/*
 * !CONFIG_NUMA stub: always returns NULL; @adistance is ignored.
 *
 * Note the asymmetry: the CONFIG_NUMA implementation reports failure with a
 * non-NULL error value, whereas this stub returns NULL.
 */
static inline struct memory_dev_type *alloc_memory_type(int adistance)
{
	return NULL;
}
|
|
|
|
/* !CONFIG_NUMA stub: intentionally a no-op; @memtype is ignored. */
static inline void put_memory_type(struct memory_dev_type *memtype)
{
}
|
|
|
|
/* !CONFIG_NUMA stub: intentionally a no-op; both arguments are ignored. */
static inline void init_node_memory_type(int node, struct memory_dev_type *default_type)
{
}
|
|
|
|
/* !CONFIG_NUMA stub: intentionally a no-op; both arguments are ignored. */
static inline void clear_node_memory_type(int node, struct memory_dev_type *memtype)
{
}
|
|
|
|
static inline int next_demotion_node(int node, const nodemask_t *allowed_mask)
|
|
{
|
|
return NUMA_NO_NODE;
|
|
}
|
|
|
|
/*
 * !CONFIG_NUMA stub: stores NODE_MASK_NONE in *@targets; @pgdat is not
 * consulted. @targets must be a valid pointer.
 */
static inline void node_get_allowed_targets(pg_data_t *pgdat, nodemask_t *targets)
{
	*targets = NODE_MASK_NONE;
}
|
|
|
|
/* !CONFIG_NUMA stub: reports every node as top tier, regardless of @node. */
static inline bool node_is_toptier(int node)
{
	return true;
}
|
|
|
|
/* !CONFIG_NUMA stub: does nothing with @nb and returns 0. */
static inline int register_mt_adistance_algorithm(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
/* !CONFIG_NUMA stub: does nothing with @nb and returns 0. */
static inline int unregister_mt_adistance_algorithm(struct notifier_block *nb)
{
	return 0;
}
|
|
|
|
static inline int mt_calc_adistance(int node, int *adist)
|
|
{
|
|
return NOTIFY_DONE;
|
|
}
|
|
|
|
/* !CONFIG_NUMA stub: always fails with -EIO; all arguments are ignored. */
static inline int mt_set_default_dram_perf(int nid, struct access_coordinate *perf,
					   const char *source)
{
	return -EIO;
}
|
|
|
|
/*
 * !CONFIG_NUMA stub: always fails with -EIO and never writes to @adist;
 * @perf is ignored.
 */
static inline int mt_perf_to_adistance(struct access_coordinate *perf, int *adist)
{
	return -EIO;
}
|
|
|
|
/* !CONFIG_NUMA stub: always returns NULL; both arguments are ignored. */
static inline struct memory_dev_type *mt_find_alloc_memory_type(int adist,
								struct list_head *memory_types)
{
	return NULL;
}
|
|
|
|
/* !CONFIG_NUMA stub: intentionally a no-op; @memory_types is ignored. */
static inline void mt_put_memory_types(struct list_head *memory_types)
{
}
|
|
#endif /* CONFIG_NUMA */
|
|
#endif /* _LINUX_MEMORY_TIERS_H */
|