mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-18 22:14:16 +00:00 
			
		
		
		
	 eb33575cf6
			
		
	
	
		eb33575cf6
		
	
	
	
	
		
			
			pfn_valid() is meant to be able to tell if a given PFN has valid memmap associated with it or not. In FLATMEM, it is expected that holes always have valid memmap as long as there is valid PFNs either side of the hole. In SPARSEMEM, it is assumed that a valid section has a memmap for the entire section. However, ARM and maybe other embedded architectures in the future free memmap backing holes to save memory on the assumption the memmap is never used. The page_zone linkages are then broken even though pfn_valid() returns true. A walker of the full memmap must then do this additional check to ensure the memmap they are looking at is sane by making sure the zone and PFN linkages are still valid. This is expensive, but walkers of the full memmap are extremely rare. This was caught before for FLATMEM and hacked around but it hits again for SPARSEMEM because the page_zone linkages can look ok where the PFN linkages are totally screwed. This looks like a hatchet job but the reality is that any clean solution would end up consumning all the memory saved by punching these unexpected holes in the memmap. For example, we tried marking the memmap within the section invalid but the section size exceeds the size of the hole in most cases so pfn_valid() starts returning false where valid memmap exists. Shrinking the size of the section would increase memory consumption offsetting the gains. This patch identifies when an architecture is punching unexpected holes in the memmap that the memory model cannot automatically detect and sets ARCH_HAS_HOLES_MEMORYMODEL. At the moment, this is restricted to EP93xx which is the model sub-architecture this has been reported on but may expand later. When set, walkers of the full memmap must call memmap_valid_within() for each PFN and passing in what it expects the page and zone to be for that PFN. If it finds the linkages to be broken, it assumes the memmap is invalid for that PFN. Signed-off-by: Mel Gorman <mel@csn.ul.ie> Signed-off-by: Russell King <rmk+kernel@arm.linux.org.uk>
		
			
				
	
	
		
			89 lines
		
	
	
	
		
			1.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			89 lines
		
	
	
	
		
			1.8 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * linux/mm/mmzone.c
 | |
|  *
 | |
|  * management codes for pgdats and zones.
 | |
|  */
 | |
| 
 | |
| 
 | |
| #include <linux/stddef.h>
 | |
| #include <linux/mm.h>
 | |
| #include <linux/mmzone.h>
 | |
| #include <linux/module.h>
 | |
| 
 | |
| struct pglist_data *first_online_pgdat(void)
 | |
| {
 | |
| 	return NODE_DATA(first_online_node);
 | |
| }
 | |
| 
 | |
| struct pglist_data *next_online_pgdat(struct pglist_data *pgdat)
 | |
| {
 | |
| 	int nid = next_online_node(pgdat->node_id);
 | |
| 
 | |
| 	if (nid == MAX_NUMNODES)
 | |
| 		return NULL;
 | |
| 	return NODE_DATA(nid);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * next_zone - helper magic for for_each_zone()
 | |
|  */
 | |
| struct zone *next_zone(struct zone *zone)
 | |
| {
 | |
| 	pg_data_t *pgdat = zone->zone_pgdat;
 | |
| 
 | |
| 	if (zone < pgdat->node_zones + MAX_NR_ZONES - 1)
 | |
| 		zone++;
 | |
| 	else {
 | |
| 		pgdat = next_online_pgdat(pgdat);
 | |
| 		if (pgdat)
 | |
| 			zone = pgdat->node_zones;
 | |
| 		else
 | |
| 			zone = NULL;
 | |
| 	}
 | |
| 	return zone;
 | |
| }
 | |
| 
 | |
| static inline int zref_in_nodemask(struct zoneref *zref, nodemask_t *nodes)
 | |
| {
 | |
| #ifdef CONFIG_NUMA
 | |
| 	return node_isset(zonelist_node_idx(zref), *nodes);
 | |
| #else
 | |
| 	return 1;
 | |
| #endif /* CONFIG_NUMA */
 | |
| }
 | |
| 
 | |
| /* Returns the next zone at or below highest_zoneidx in a zonelist */
 | |
| struct zoneref *next_zones_zonelist(struct zoneref *z,
 | |
| 					enum zone_type highest_zoneidx,
 | |
| 					nodemask_t *nodes,
 | |
| 					struct zone **zone)
 | |
| {
 | |
| 	/*
 | |
| 	 * Find the next suitable zone to use for the allocation.
 | |
| 	 * Only filter based on nodemask if it's set
 | |
| 	 */
 | |
| 	if (likely(nodes == NULL))
 | |
| 		while (zonelist_zone_idx(z) > highest_zoneidx)
 | |
| 			z++;
 | |
| 	else
 | |
| 		while (zonelist_zone_idx(z) > highest_zoneidx ||
 | |
| 				(z->zone && !zref_in_nodemask(z, nodes)))
 | |
| 			z++;
 | |
| 
 | |
| 	*zone = zonelist_zone(z);
 | |
| 	return z;
 | |
| }
 | |
| 
 | |
| #ifdef CONFIG_ARCH_HAS_HOLES_MEMORYMODEL
 | |
| int memmap_valid_within(unsigned long pfn,
 | |
| 					struct page *page, struct zone *zone)
 | |
| {
 | |
| 	if (page_to_pfn(page) != pfn)
 | |
| 		return 0;
 | |
| 
 | |
| 	if (page_zone(page) != zone)
 | |
| 		return 0;
 | |
| 
 | |
| 	return 1;
 | |
| }
 | |
| #endif /* CONFIG_ARCH_HAS_HOLES_MEMORYMODEL */
 |