* map_physical_memory() now always sets a memory type. If none is given (it
  needs to be or'ed into the address specification), "uncached" is assumed
  (see the usage sketch after this list).
* Set the memory type for the "BIOS" and "DMA" areas to write-back. Not sure if
  that's correct, but that's what was effectively used on my machines before.
* Changed x86_set_mtrrs() and the CPU module hook to also set the default memory
  type.
* Rewrote the MTRR computation once more:
  - Now we know all used memory ranges, so we are free to extend used ranges
    into unused ones in order to simplify them for MTRR setup.
  - Leverage the subtractive properties of uncached and write-through ranges
    to simplify the other ranges: an uncached range may intersect a range of
    any other type (the result is still uncached), and a write-through range
    may intersect write-back ranges (the result is write-through).
  - Set the default memory type to write-back, so we don't need MTRRs for the
    RAM ranges.
  - If a new range intersects with an existing one, we no longer just fail.
    Instead we use the strictest requirement implied by the intersecting
    ranges. This fixes #5383.
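
For illustration, a minimal usage sketch of the new map_physical_memory()
convention (a hypothetical driver snippet: the frame buffer address and size
are made up, and B_MTR_WC merely stands in for whatever type the hardware
wants):

    // Map a hypothetical frame buffer write-combined. The B_MTR_* flag is
    // simply or'ed into the address specification; leaving it out now yields
    // an uncached (B_MTR_UC) mapping.
    static area_id
    map_frame_buffer(void** _virtualBase)
    {
        return map_physical_memory("frame buffer", (void*)0xe8000000,
            4 * 1024 * 1024, B_ANY_KERNEL_ADDRESS | B_MTR_WC,
            B_KERNEL_READ_AREA | B_KERNEL_WRITE_AREA, _virtualBase);
    }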

Overall the new algorithm should get by with far fewer MTRRs than before (on my
desktop machine at most 4 are used now, while 8 didn't quite suffice before). A
drawback of the current implementation is that it doesn't deal with running out
of MTRRs at all, which might result in some ranges having weaker caching/memory
ordering properties than requested.
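
An MTRR can only describe a power-of-two sized block whose base is aligned to
that size, so an arbitrary page-aligned range has to be decomposed. The
following standalone sketch mirrors the two-ended decomposition that the new
add_mtrrs_for_range() (see the diff below) performs; the frame buffer address
and size are made up for illustration:

    #include <cstdint>
    #include <cstdio>

    // Peel power-of-two blocks off a page-aligned range, smallest first,
    // from whichever end is misaligned. Prints each block and returns how
    // many MTRRs the range costs.
    static int
    count_mtrrs_for_range(uint64_t base, uint64_t size)
    {
        int count = 0;
        for (uint64_t interval = 0x1000; size > 0; interval <<= 1) {
            if (((base | size) & interval) != 0) {
                uint64_t blockBase = (base & interval) != 0
                    ? base : base + size - interval;
                printf("  mtrr: base %#10llx, size %#10llx\n",
                    (unsigned long long)blockBase,
                    (unsigned long long)interval);
                if ((base & interval) != 0)
                    base += interval;
                size -= interval;
                count++;
            }
        }
        return count;
    }

    int
    main()
    {
        // 3 MB at 0xe8000000 cost two MTRRs (2 MB + 1 MB). Extending the
        // range to an aligned 4 MB first -- what the new algorithm does when
        // the adjacent space is unused -- would cost only one.
        printf("%d MTRRs\n", count_mtrrs_for_range(0xe8000000, 0x300000));
        return 0;
    }

This also illustrates why the old setup could run out of registers: every
misaligned boundary costs an extra MTRR, while extending ranges into unused
memory and relying on a write-back default removes most of them.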


git-svn-id: file:///srv/svn/repos/haiku/haiku/trunk@35515 a95241bf-73f2-0310-859d-f6bbb57e9c96
Author: Ingo Weinhold
Date:   2010-02-18 13:52:43 +00:00
Commit: dac21d8bfe (parent e5b2296d48)

10 changed files with 463 additions and 423 deletions


@@ -124,7 +124,8 @@ typedef struct x86_cpu_module_info {
 		uint8 type);
 	status_t (*get_mtrr)(uint32 index, uint64* _base, uint64* _length,
 		uint8* _type);
-	void (*set_mtrrs)(const x86_mtrr_info* infos, uint32 count);
+	void (*set_mtrrs)(uint8 defaultType, const x86_mtrr_info* infos,
+		uint32 count);
 	void (*get_optimized_functions)(x86_optimized_functions* functions);
 } x86_cpu_module_info;
@@ -290,7 +291,8 @@ uint32 x86_count_mtrrs(void);
 void x86_set_mtrr(uint32 index, uint64 base, uint64 length, uint8 type);
 status_t x86_get_mtrr(uint32 index, uint64* _base, uint64* _length,
 	uint8* _type);
-void x86_set_mtrrs(const x86_mtrr_info* infos, uint32 count);
+void x86_set_mtrrs(uint8 defaultType, const x86_mtrr_info* infos,
+	uint32 count);
 bool x86_check_feature(uint32 feature, enum x86_feature_type type);
 void* x86_get_double_fault_stack(int32 cpu, size_t* _size);
 int32 x86_double_fault_get_cpu(void);


@@ -43,9 +43,9 @@ amd_init(void)
 static void
-amd_set_mtrrs(const x86_mtrr_info* infos, uint32 count)
+amd_set_mtrrs(uint8 defaultType, const x86_mtrr_info* infos, uint32 count)
 {
-	generic_set_mtrrs(infos, count, generic_count_mtrrs());
+	generic_set_mtrrs(defaultType, infos, count, generic_count_mtrrs());
 }


@@ -173,7 +173,8 @@ generic_get_mtrr(uint32 index, uint64 *_base, uint64 *_length, uint8 *_type)
 void
-generic_set_mtrrs(const x86_mtrr_info* infos, uint32 count, uint32 maxCount)
+generic_set_mtrrs(uint8 newDefaultType, const x86_mtrr_info* infos,
+	uint32 count, uint32 maxCount)
 {
 	// check count
 	if (maxCount == 0)
@@ -195,7 +196,8 @@ generic_set_mtrrs(const x86_mtrr_info* infos, uint32 count, uint32 maxCount)
 	for (uint32 i = count; i < maxCount; i++)
 		set_mtrr(i, 0, 0, 0);
 
-	// re-enable MTTRs
+	// re-enable MTTRs and set the new default type
+	defaultType = (defaultType & ~(uint64)0xff) | newDefaultType;
 	x86_write_msr(IA32_MSR_MTRR_DEFAULT_TYPE, defaultType | IA32_MTRR_ENABLE);
 }


@@ -25,7 +25,8 @@ extern void generic_init_mtrrs(uint32 count);
 extern void generic_set_mtrr(uint32 index, uint64 base, uint64 length, uint8 type);
 extern status_t generic_get_mtrr(uint32 index, uint64 *_base, uint64 *_length,
 	uint8 *_type);
-extern void generic_set_mtrrs(const struct x86_mtrr_info* infos,
+extern void generic_set_mtrrs(uint8 defaultType,
+	const struct x86_mtrr_info* infos,
 	uint32 count, uint32 maxCount);
 extern status_t generic_mtrr_compute_physical_mask(void);


@@ -38,9 +38,9 @@ intel_init(void)
 static void
-intel_set_mtrrs(const x86_mtrr_info* infos, uint32 count)
+intel_set_mtrrs(uint8 defaultType, const x86_mtrr_info* infos, uint32 count)
 {
-	generic_set_mtrrs(infos, count, generic_count_mtrrs());
+	generic_set_mtrrs(defaultType, infos, count, generic_count_mtrrs());
 }


@@ -32,9 +32,9 @@ via_init_mtrrs(void)
 static void
-via_set_mtrrs(const x86_mtrr_info* infos, uint32 count)
+via_set_mtrrs(uint8 defaultType, const x86_mtrr_info* infos, uint32 count)
 {
-	generic_set_mtrrs(infos, count, via_count_mtrrs());
+	generic_set_mtrrs(defaultType, infos, count, via_count_mtrrs());
 }


@@ -73,6 +73,7 @@ struct set_mtrr_parameter {
 struct set_mtrrs_parameter {
 	const x86_mtrr_info*	infos;
 	uint32					count;
+	uint8					defaultType;
 };
@@ -188,7 +189,8 @@ set_mtrrs(void* _parameter, int cpu)
 	disable_caches();
 
-	sCpuModule->set_mtrrs(parameter->infos, parameter->count);
+	sCpuModule->set_mtrrs(parameter->defaultType, parameter->infos,
+		parameter->count);
 
 	enable_caches();
@@ -248,9 +250,13 @@ x86_get_mtrr(uint32 index, uint64 *_base, uint64 *_length, uint8 *_type)
 void
-x86_set_mtrrs(const x86_mtrr_info* infos, uint32 count)
+x86_set_mtrrs(uint8 defaultType, const x86_mtrr_info* infos, uint32 count)
 {
+	if (sCpuModule == NULL)
+		return;
+
 	struct set_mtrrs_parameter parameter;
+	parameter.defaultType = defaultType;
 	parameter.infos = infos;
 	parameter.count = count;


@@ -1,5 +1,5 @@
 /*
- * Copyright 2009, Ingo Weinhold, ingo_weinhold@gmx.de.
+ * Copyright 2009-2010, Ingo Weinhold, ingo_weinhold@gmx.de.
  * Copyright 2008, Jérôme Duval.
  * Copyright 2002-2007, Axel Dörfler, axeld@pinc-software.de.
  * Distributed under the terms of the MIT License.
@@ -12,6 +12,9 @@
 #include <stdlib.h>
 #include <string.h>
 
+#include <algorithm>
+#include <new>
+
 #include <KernelExport.h>
 #include <smp.h>
@@ -38,37 +41,26 @@
 #	define TRACE(x) ;
 #endif
 
-#define TRACE_MTRR_ARCH_VM
-#ifdef TRACE_MTRR_ARCH_VM
+// 0: disabled, 1: some, 2: more
+#define TRACE_MTRR_ARCH_VM 1
+
+#if TRACE_MTRR_ARCH_VM >= 1
 #	define TRACE_MTRR(x...) dprintf(x)
 #else
 #	define TRACE_MTRR(x...)
 #endif
 
-static const uint32 kMaxMemoryTypeRanges = 32;
-static const uint32 kMaxMemoryTypeRegisters = 32;
-static const uint64 kMinMemoryTypeRangeSize = 1 << 12;
+#if TRACE_MTRR_ARCH_VM >= 2
+#	define TRACE_MTRR2(x...) dprintf(x)
+#else
+#	define TRACE_MTRR2(x...)
+#endif
 
-struct memory_type_range_analysis_info {
-	uint64 size;
-	uint32 rangesNeeded;
-	uint32 subtractiveRangesNeeded;
-	uint64 bestSubtractiveRange;
-};
+void *gDmaAddress;
 
-struct memory_type_range_analysis {
-	uint64 base;
-	uint64 size;
-	uint32 type;
-	uint32 rangesNeeded;
-	uint64 endRange;
-	memory_type_range_analysis_info left;
-	memory_type_range_analysis_info right;
-};
-
-struct memory_type_range {
+struct memory_type_range : DoublyLinkedListLinkImpl<memory_type_range> {
 	uint64 base;
 	uint64 size;
 	uint32 type;
@@ -76,306 +68,404 @@ struct memory_type_range {
 };
 
 
-void *gDmaAddress;
+struct memory_type_range_point
+		: DoublyLinkedListLinkImpl<memory_type_range_point> {
+	uint64 address;
+	memory_type_range* range;
+
+	bool IsStart() const	{ return range->base == address; }
+
+	bool operator<(const memory_type_range_point& other) const
+	{
+		return address < other.address;
+	}
+};
 
-static memory_type_range sMemoryTypeRanges[kMaxMemoryTypeRanges];
-static uint32 sMemoryTypeRangeCount;
-static memory_type_range_analysis sMemoryTypeRangeAnalysis[
-	kMaxMemoryTypeRanges];
+typedef DoublyLinkedList<memory_type_range> MemoryTypeRangeList;
+
+static mutex sMemoryTypeLock = MUTEX_INITIALIZER("memory type ranges");
+static MemoryTypeRangeList sMemoryTypeRanges;
+static int32 sMemoryTypeRangeCount = 0;
+
+static const uint32 kMaxMemoryTypeRegisters = 32;
 static x86_mtrr_info sMemoryTypeRegisters[kMaxMemoryTypeRegisters];
 static uint32 sMemoryTypeRegisterCount;
 static uint32 sMemoryTypeRegistersUsed;
-static mutex sMemoryTypeLock = MUTEX_INITIALIZER("memory type ranges");
+
+static memory_type_range* sTemporaryRanges = NULL;
+static memory_type_range_point* sTemporaryRangePoints = NULL;
+static int32 sTemporaryRangeCount = 0;
+static int32 sTemporaryRangePointCount = 0;
 
 
 static void
 set_mtrrs()
 {
-	x86_set_mtrrs(sMemoryTypeRegisters, sMemoryTypeRegistersUsed);
+	x86_set_mtrrs(IA32_MTR_WRITE_BACK, sMemoryTypeRegisters,
+		sMemoryTypeRegistersUsed);
 
-#ifdef TRACE_MTRR_ARCH_VM
+#if TRACE_MTRR_ARCH_VM
 	TRACE_MTRR("set MTRRs to:\n");
 	for (uint32 i = 0; i < sMemoryTypeRegistersUsed; i++) {
 		const x86_mtrr_info& info = sMemoryTypeRegisters[i];
-		TRACE_MTRR("  mtrr: %2lu: base: %#9llx, size: %#9llx, type: %u\n",
-			i, info.base, info.size, info.type);
+		TRACE_MTRR("  mtrr: %2" B_PRIu32 ": base: %#10" B_PRIx64 ", size: %#10"
+			B_PRIx64 ", type: %u\n", i, info.base, info.size,
+			info.type);
 	}
 #endif
 }
 
 
-static void
+static bool
 add_used_mtrr(uint64 base, uint64 size, uint32 type)
 {
-	ASSERT(sMemoryTypeRegistersUsed < sMemoryTypeRegisterCount);
+	if (sMemoryTypeRegistersUsed == sMemoryTypeRegisterCount) {
+		dprintf("add_used_mtrr(%#" B_PRIx64 ", %#" B_PRIx64 ", %" B_PRIu32
+			"): out of MTRRs!\n", base, size, type);
+		return false;
+	}
 
-	x86_mtrr_info& info = sMemoryTypeRegisters[sMemoryTypeRegistersUsed++];
-	info.base = base;
-	info.size = size;
-	info.type = type;
+	x86_mtrr_info& mtrr = sMemoryTypeRegisters[sMemoryTypeRegistersUsed++];
+	mtrr.base = base;
+	mtrr.size = size;
+	mtrr.type = type;
+
+	return true;
+}
+
+
+static bool
+add_mtrrs_for_range(uint64 base, uint64 size, uint32 type)
+{
+	for (uint64 interval = B_PAGE_SIZE; size > 0; interval <<= 1) {
+		if (((base | size) & interval) != 0) {
+			if ((base & interval) != 0) {
+				if (!add_used_mtrr(base, interval, type))
+					return false;
+				base += interval;
+			} else {
+				if (!add_used_mtrr(base + size - interval, interval, type))
+					return false;
+			}
+
+			size -= interval;
+		}
+	}
+
+	return true;
+}
+
+
+static memory_type_range*
+find_range(area_id areaID)
+{
+	for (MemoryTypeRangeList::Iterator it = sMemoryTypeRanges.GetIterator();
+			memory_type_range* range = it.Next();) {
+		if (range->area == areaID)
+			return range;
+	}
+
+	return NULL;
 }
 
 
 static void
-analyze_range(memory_type_range_analysis& analysis, uint64 previousEnd,
-	uint64 nextBase)
+optimize_memory_ranges(MemoryTypeRangeList& ranges, uint32 type,
+	bool removeRanges)
 {
-	uint64 base = analysis.base;
-	uint64 size = analysis.size;
-
-	memory_type_range_analysis_info& left = analysis.left;
-	memory_type_range_analysis_info& right = analysis.right;
-
-	uint32 leftSubtractiveRangesNeeded = 2;
-	int32 leftBestSubtractiveRangeDifference = 0;
-	uint32 leftBestSubtractivePositiveRangesNeeded = 0;
-	uint32 leftBestSubtractiveRangesNeeded = 0;
-
-	uint32 rightSubtractiveRangesNeeded = 2;
-	int32 rightBestSubtractiveRangeDifference = 0;
-	uint32 rightBestSubtractivePositiveRangesNeeded = 0;
-	uint32 rightBestSubtractiveRangesNeeded = 0;
-
-	uint64 range = kMinMemoryTypeRangeSize;
-
-	while (size > 0) {
-		if ((base & range) != 0) {
-			left.rangesNeeded++;
-
-			bool replaceBestSubtractive = false;
-			int32 rangeDifference = (int32)left.rangesNeeded
-				- (int32)leftSubtractiveRangesNeeded;
-			if (left.bestSubtractiveRange == 0
-				|| leftBestSubtractiveRangeDifference < rangeDifference) {
-				// check for intersection with previous range
-				replaceBestSubtractive
-					= previousEnd == 0 || base - range >= previousEnd;
-			}
-
-			if (replaceBestSubtractive) {
-				leftBestSubtractiveRangeDifference = rangeDifference;
-				leftBestSubtractiveRangesNeeded
-					= leftSubtractiveRangesNeeded;
-				left.bestSubtractiveRange = range;
-				leftBestSubtractivePositiveRangesNeeded = 0;
-			} else
-				leftBestSubtractivePositiveRangesNeeded++;
-
-			left.size += range;
-			base += range;
-			size -= range;
-		} else if (left.bestSubtractiveRange > 0)
-			leftSubtractiveRangesNeeded++;
-
-		if ((size & range) != 0) {
-			right.rangesNeeded++;
-
-			bool replaceBestSubtractive = false;
-			int32 rangeDifference = (int32)right.rangesNeeded
-				- (int32)rightSubtractiveRangesNeeded;
-			if (right.bestSubtractiveRange == 0
-				|| rightBestSubtractiveRangeDifference < rangeDifference) {
-				// check for intersection with previous range
-				replaceBestSubtractive
-					= nextBase == 0 || base + size + range <= nextBase;
-			}
-
-			if (replaceBestSubtractive) {
-				rightBestSubtractiveRangeDifference = rangeDifference;
-				rightBestSubtractiveRangesNeeded
-					= rightSubtractiveRangesNeeded;
-				right.bestSubtractiveRange = range;
-				rightBestSubtractivePositiveRangesNeeded = 0;
-			} else
-				rightBestSubtractivePositiveRangesNeeded++;
-
-			right.size += range;
-			size -= range;
-		} else if (right.bestSubtractiveRange > 0)
-			rightSubtractiveRangesNeeded++;
-
-		range <<= 1;
-	}
-
-	analysis.endRange = range;
-
-	// If a subtractive setup doesn't have any advantages, don't use it.
-	// Also compute analysis.rangesNeeded.
-	if (leftBestSubtractiveRangesNeeded
-			+ leftBestSubtractivePositiveRangesNeeded >= left.rangesNeeded) {
-		left.bestSubtractiveRange = 0;
-		left.subtractiveRangesNeeded = 0;
-		analysis.rangesNeeded = left.rangesNeeded;
-	} else {
-		left.subtractiveRangesNeeded = leftBestSubtractiveRangesNeeded
-			+ leftBestSubtractivePositiveRangesNeeded;
-		analysis.rangesNeeded = left.subtractiveRangesNeeded;
-	}
-
-	if (rightBestSubtractiveRangesNeeded
-			+ rightBestSubtractivePositiveRangesNeeded >= right.rangesNeeded) {
-		right.bestSubtractiveRange = 0;
-		right.subtractiveRangesNeeded = 0;
-		analysis.rangesNeeded += right.rangesNeeded;
-	} else {
-		right.subtractiveRangesNeeded = rightBestSubtractiveRangesNeeded
-			+ rightBestSubtractivePositiveRangesNeeded;
-		analysis.rangesNeeded += right.subtractiveRangesNeeded;
-	}
-}
-
-
-static void
-compute_mtrrs(const memory_type_range_analysis& analysis)
-{
-	const memory_type_range_analysis_info& left = analysis.left;
-	const memory_type_range_analysis_info& right = analysis.right;
-
-	// generate a setup for the left side
-	if (left.rangesNeeded > 0) {
-		uint64 base = analysis.base;
-		uint64 size = left.size;
-		uint64 range = analysis.endRange;
-		uint64 rangeEnd = base + size;
-		bool subtractive = false;
-		while (size > 0) {
-			if (range == left.bestSubtractiveRange) {
-				base = rangeEnd - 2 * range;
-				add_used_mtrr(base, range, analysis.type);
-				subtractive = true;
-				break;
-			}
-
-			if ((size & range) != 0) {
-				rangeEnd -= range;
-				add_used_mtrr(rangeEnd, range, analysis.type);
-				size -= range;
-			}
-
-			range >>= 1;
-		}
-
-		if (subtractive) {
-			uint64 shortestRange = range;
-			while (size > 0) {
-				if ((size & range) != 0) {
-					shortestRange = range;
-					size -= range;
-				} else {
-					add_used_mtrr(base, range, IA32_MTR_UNCACHED);
-					base += range;
-				}
-
-				range >>= 1;
-			}
-
-			add_used_mtrr(base, shortestRange, IA32_MTR_UNCACHED);
-		}
-	}
-
-	// generate a setup for the right side
-	if (right.rangesNeeded > 0) {
-		uint64 base = analysis.base + left.size;
-		uint64 size = right.size;
-		uint64 range = analysis.endRange;
-		bool subtractive = false;
-		while (size > 0) {
-			if (range == right.bestSubtractiveRange) {
-				add_used_mtrr(base, range * 2, analysis.type);
-				subtractive = true;
-				break;
-			}
-
-			if ((size & range) != 0) {
-				add_used_mtrr(base, range, analysis.type);
-				base += range;
-				size -= range;
-			}
-
-			range >>= 1;
-		}
-
-		if (subtractive) {
-			uint64 rangeEnd = base + range * 2;
-			uint64 shortestRange = range;
-			while (size > 0) {
-				if ((size & range) != 0) {
-					shortestRange = range;
-					size -= range;
-				} else {
-					rangeEnd -= range;
-					add_used_mtrr(rangeEnd, range, IA32_MTR_UNCACHED);
-				}
-
-				range >>= 1;
-			}
-
-			rangeEnd -= shortestRange;
-			add_used_mtrr(rangeEnd, shortestRange, IA32_MTR_UNCACHED);
-		}
-	}
-}
-
-
-static status_t
-update_mttrs()
-{
-	// Transfer the range array to the analysis array, dropping all uncachable
-	// ranges (that's the default anyway) and joining adjacent ranges with the
-	// same type.
-	memory_type_range_analysis* ranges = sMemoryTypeRangeAnalysis;
-	uint32 rangeCount = 0;
-	{
-		uint32 previousRangeType = IA32_MTR_UNCACHED;
-		uint64 previousRangeEnd = 0;
-		for (uint32 i = 0; i < sMemoryTypeRangeCount; i++) {
-			if (sMemoryTypeRanges[i].type != IA32_MTR_UNCACHED) {
-				uint64 rangeEnd = sMemoryTypeRanges[i].base
-					+ sMemoryTypeRanges[i].size;
-				if (previousRangeType == sMemoryTypeRanges[i].type
-					&& previousRangeEnd >= sMemoryTypeRanges[i].base) {
-					// the range overlaps/continues the previous range -- just
-					// enlarge that one
-					if (rangeEnd > previousRangeEnd)
-						previousRangeEnd = rangeEnd;
-					ranges[rangeCount - 1].size = previousRangeEnd
-						- ranges[rangeCount - 1].base;
-				} else {
-					// add the new range
-					memset(&ranges[rangeCount], 0, sizeof(ranges[rangeCount]));
-					ranges[rangeCount].base = sMemoryTypeRanges[i].base;
-					ranges[rangeCount].size = sMemoryTypeRanges[i].size;
-					ranges[rangeCount].type = sMemoryTypeRanges[i].type;
-					previousRangeEnd = rangeEnd;
-					previousRangeType = sMemoryTypeRanges[i].type;
-					rangeCount++;
-				}
-			}
-		}
-	}
-
-	// analyze the ranges
-	uint32 registersNeeded = 0;
-	uint64 previousEnd = 0;
-	for (uint32 i = 0; i < rangeCount; i++) {
-		memory_type_range_analysis& range = ranges[i];
-		uint64 nextBase = i + 1 < rangeCount ? ranges[i + 1].base : 0;
-		analyze_range(range, previousEnd, nextBase);
-		registersNeeded += range.rangesNeeded;
-		previousEnd = range.base + range.size;
-	}
-
-	// fail when we need more registers than we have
-	if (registersNeeded > sMemoryTypeRegisterCount)
-		return B_BUSY;
-
-	sMemoryTypeRegistersUsed = 0;
-
-	for (uint32 i = 0; i < rangeCount; i++) {
-		memory_type_range_analysis& range = ranges[i];
-		compute_mtrrs(range);
-	}
+	uint64 previousEnd = 0;
+	uint64 nextStart = 0;
+	MemoryTypeRangeList::Iterator it = ranges.GetIterator();
+	memory_type_range* range = it.Next();
+	while (range != NULL) {
+		if (range->type != type) {
+			previousEnd = range->base + range->size;
+			nextStart = 0;
+			range = it.Next();
+			continue;
+		}
+
+		// find the start of the next range we cannot join this one with
+		if (nextStart == 0) {
+			MemoryTypeRangeList::Iterator nextIt = it;
+			while (memory_type_range* nextRange = nextIt.Next()) {
+				if (nextRange->type != range->type) {
+					nextStart = nextRange->base;
+					break;
+				}
+			}
+
+			if (nextStart == 0) {
+				// no upper limit -- set an artificial one, so we don't need to
+				// special case below
+				nextStart = (uint64)1 << 32;
+			}
+		}
+
+		// Align the range's base and end to the greatest power of two
+		// possible. As long as we can align both without intersecting any
+		// differently typed range, we can extend the range without making it
+		// more complicated. Once one side hit a limit we need to be careful.
+		// We can still continue aligning the other side, if the range crosses
+		// the power of two boundary.
+		uint64 rangeBase = range->base;
+		uint64 rangeEnd = rangeBase + range->size;
+		uint64 interval = B_PAGE_SIZE * 2;
+		while (true) {
+			uint64 alignedBase = rangeBase & ~(interval - 1);
+			uint64 alignedEnd = (rangeEnd + interval - 1) & ~(interval - 1);
+
+			if (alignedBase < previousEnd)
+				alignedBase += interval;
+
+			if (alignedEnd > nextStart)
+				alignedEnd -= interval;
+
+			if (alignedBase >= alignedEnd)
+				break;
+
+			rangeBase = std::min(rangeBase, alignedBase);
+			rangeEnd = std::max(rangeEnd, alignedEnd);
+
+			interval <<= 1;
+		}
+
+		range->base = rangeBase;
+		range->size = rangeEnd - rangeBase;
+
+		if (removeRanges)
+			it.Remove();
+
+		previousEnd = rangeEnd;
+
+		// Skip the subsequent ranges we have swallowed and possible cut one
+		// we now partially intersect with.
+		while ((range = it.Next()) != NULL) {
+			if (range->base >= rangeEnd)
+				break;
+
+			if (range->base + range->size > rangeEnd) {
+				// we partially intersect -- cut the range
+				range->size = range->base + range->size - rangeEnd;
+				range->base = rangeEnd;
+				break;
+			}
+
+			// we have swallowed this range completely
+			range->size = 0;
+			it.Remove();
+		}
+	}
+}
+
+
+static bool
+ensure_temporary_ranges_space(int32 count)
+{
+	if (sTemporaryRangeCount >= count && sTemporaryRangePointCount >= count)
+		return true;
+
+	// round count to power of 2
+	int32 unalignedCount = count;
+	count = 8;
+	while (count < unalignedCount)
+		count <<= 1;
+
+	// resize ranges array
+	if (sTemporaryRangeCount < count) {
+		memory_type_range* ranges = new(std::nothrow) memory_type_range[count];
+		if (ranges == NULL)
+			return false;
+
+		delete[] sTemporaryRanges;
+		sTemporaryRanges = ranges;
+		sTemporaryRangeCount = count;
+	}
+
+	// resize points array
+	if (sTemporaryRangePointCount < count) {
+		memory_type_range_point* points
+			= new(std::nothrow) memory_type_range_point[count];
+		if (points == NULL)
+			return false;
+
+		delete[] sTemporaryRangePoints;
+		sTemporaryRangePoints = points;
+		sTemporaryRangePointCount = count;
+	}
+
+	return true;
+}
+
+
+status_t
+update_mtrrs()
+{
+	// resize the temporary points/ranges arrays, if necessary
+	if (!ensure_temporary_ranges_space(sMemoryTypeRangeCount * 2))
+		return B_NO_MEMORY;
+
+	// get the range points and sort them
+	memory_type_range_point* rangePoints = sTemporaryRangePoints;
+	int32 pointCount = 0;
+	for (MemoryTypeRangeList::Iterator it = sMemoryTypeRanges.GetIterator();
+			memory_type_range* range = it.Next();) {
+		rangePoints[pointCount].address = range->base;
+		rangePoints[pointCount++].range = range;
+		rangePoints[pointCount].address = range->base + range->size;
+		rangePoints[pointCount++].range = range;
+	}
+
+	std::sort(rangePoints, rangePoints + pointCount);
+
+#if TRACE_MTRR_ARCH_VM >= 2
+	TRACE_MTRR2("memory type range points:\n");
+	for (int32 i = 0; i < pointCount; i++) {
+		TRACE_MTRR2("%12" B_PRIx64 " (%p)\n", rangePoints[i].address,
+			rangePoints[i].range);
+	}
+#endif
+
+	// Compute the effective ranges. When ranges overlap, we go with the
+	// stricter requirement. The types are not necessarily totally ordered, so
+	// the order we use below is not always correct. To keep it simple we
+	// consider it the reponsibility of the callers not to define overlapping
+	// memory ranges with uncomparable types.
+	memory_type_range* ranges = sTemporaryRanges;
+	typedef DoublyLinkedList<memory_type_range_point> PointList;
+	PointList pendingPoints;
+	memory_type_range* activeRange = NULL;
+	int32 rangeCount = 0;
+	for (int32 i = 0; i < pointCount; i++) {
+		memory_type_range_point* point = &rangePoints[i];
+		bool terminateRange = false;
+		if (point->IsStart()) {
+			// a range start point
+			pendingPoints.Add(point);
+			if (activeRange != NULL && activeRange->type > point->range->type)
+				terminateRange = true;
+		} else {
+			// a range end point -- remove the pending start point
+			for (PointList::Iterator it = pendingPoints.GetIterator();
+					memory_type_range_point* pendingPoint = it.Next();) {
+				if (pendingPoint->range == point->range) {
+					it.Remove();
+					break;
+				}
+			}
+
+			if (point->range == activeRange)
+				terminateRange = true;
+		}
+
+		if (terminateRange) {
+			ranges[rangeCount].size = point->address - ranges[rangeCount].base;
+			rangeCount++;
+			activeRange = NULL;
+		}
+
+		if (activeRange != NULL || pendingPoints.IsEmpty())
+			continue;
+
+		// we need to start a new range -- find the strictest pending range
+		for (PointList::Iterator it = pendingPoints.GetIterator();
+				memory_type_range_point* pendingPoint = it.Next();) {
+			memory_type_range* pendingRange = pendingPoint->range;
+			if (activeRange == NULL || activeRange->type > pendingRange->type)
+				activeRange = pendingRange;
+		}
+
+		memory_type_range* previousRange = rangeCount > 0
+			? &ranges[rangeCount - 1] : NULL;
+		if (previousRange == NULL || previousRange->type != activeRange->type
+				|| previousRange->base + previousRange->size
+					< activeRange->base) {
+			// we can't join with the previous range -- add a new one
+			ranges[rangeCount].base = point->address;
+			ranges[rangeCount].type = activeRange->type;
+		} else
+			rangeCount--;
+	}
+
+#if TRACE_MTRR_ARCH_VM >= 2
+	TRACE_MTRR2("effective memory type ranges:\n");
+	for (int32 i = 0; i < rangeCount; i++) {
+		TRACE_MTRR2("%12" B_PRIx64 " - %12" B_PRIx64 ": %" B_PRIu32 "\n",
+			ranges[i].base, ranges[i].base + ranges[i].size, ranges[i].type);
+	}
+#endif
+
+	// Extend ranges to be more MTRR-friendly. A range is MTRR friendly, when
+	// it has a power of two size and a base address aligned to the size. For
+	// ranges without this property we need more than one MTRR. We improve
+	// MTRR-friendliness by aligning a range's base and end address to the
+	// greatest power of two (base rounded down, end up) such that the extended
+	// range does not intersect with any other differently typed range. We join
+	// equally typed ranges, if possible. There are two exceptions to the
+	// intersection requirement: Uncached ranges may intersect with any other
+	// range; the resulting type will still be uncached. Hence we can ignore
+	// uncached ranges when extending the other ranges. Write-through range may
+	// intersect with write-back ranges; the resulting type will be
+	// write-through. Hence we can ignore write-through ranges when extending
+	// write-back ranges.
+	MemoryTypeRangeList rangeList;
+	for (int32 i = 0; i < rangeCount; i++)
+		rangeList.Add(&ranges[i]);
+
+	static const uint32 kMemoryTypes[] = {
+		IA32_MTR_UNCACHED,
+		IA32_MTR_WRITE_COMBINING,
+		IA32_MTR_WRITE_PROTECTED,
+		IA32_MTR_WRITE_THROUGH,
+		IA32_MTR_WRITE_BACK
+	};
+	static const int32 kMemoryTypeCount = sizeof(kMemoryTypes)
+		/ sizeof(*kMemoryTypes);
+
+	for (int32 i = 0; i < kMemoryTypeCount; i++) {
+		uint32 type = kMemoryTypes[i];
+
+		// Remove uncached and write-through ranges after processing them. This
+		// let's us leverage their intersection property with any other
+		// respectively write-back ranges.
+		bool removeRanges = type == IA32_MTR_UNCACHED
+			|| type == IA32_MTR_WRITE_THROUGH;
+
+		optimize_memory_ranges(rangeList, type, removeRanges);
+	}
+
+#if TRACE_MTRR_ARCH_VM >= 2
+	TRACE_MTRR2("optimized memory type ranges:\n");
+	for (int32 i = 0; i < rangeCount; i++) {
+		if (ranges[i].size > 0) {
+			TRACE_MTRR2("%12" B_PRIx64 " - %12" B_PRIx64 ": %" B_PRIu32 "\n",
+				ranges[i].base, ranges[i].base + ranges[i].size,
+				ranges[i].type);
+		}
+	}
+#endif
+
+	// compute the mtrrs from the ranges
+	sMemoryTypeRegistersUsed = 0;
+	for (int32 i = 0; i < kMemoryTypeCount; i++) {
+		uint32 type = kMemoryTypes[i];
+
+		// skip write-back ranges -- that'll be the default type anyway
+		if (type == IA32_MTR_WRITE_BACK)
+			continue;
+
+		for (int32 i = 0; i < rangeCount; i++) {
+			if (ranges[i].size == 0 || ranges[i].type != type)
+				continue;
+
+			add_mtrrs_for_range(ranges[i].base, ranges[i].size, type);
+		}
+	}
 
 	set_mtrrs();
@@ -384,17 +474,6 @@ update_mttrs()
 }
 
 
-static void
-remove_memory_type_range_locked(uint32 index)
-{
-	sMemoryTypeRangeCount--;
-
-	if (index < sMemoryTypeRangeCount) {
-		memmove(sMemoryTypeRanges + index, sMemoryTypeRanges + index + 1,
-			(sMemoryTypeRangeCount - index) * sizeof(memory_type_range));
-	}
-}
-
-
 static status_t
 add_memory_type_range(area_id areaID, uint64 base, uint64 size, uint32 type)
 {
@@ -422,105 +501,49 @@ add_memory_type_range(area_id areaID, uint64 base, uint64 size, uint32 type)
 		return B_BAD_VALUE;
 	}
 
-	TRACE_MTRR("add_memory_type_range(%ld, %#llx, %#llx, %lu)\n", areaID, base,
-		size, type);
-
-	// base and size must at least be aligned to the minimum range size
-	if (((base | size) & (kMinMemoryTypeRangeSize - 1)) != 0) {
-		dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): Memory base or "
-			"size not minimally aligned!\n", areaID, base, size, type);
-		return B_BAD_VALUE;
-	}
+	TRACE_MTRR("add_memory_type_range(%" B_PRId32 ", %#" B_PRIx64 ", %#"
+		B_PRIx64 ", %" B_PRIu32 ")\n", areaID, base, size, type);
 
 	MutexLocker locker(sMemoryTypeLock);
 
-	if (sMemoryTypeRangeCount == kMaxMemoryTypeRanges) {
-		dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): Out of "
-			"memory ranges!\n", areaID, base, size, type);
-		return B_BUSY;
-	}
-
-	// iterate through the existing ranges and check for clashes
-	bool foundInsertionIndex = false;
-	uint32 index = 0;
-	for (uint32 i = 0; i < sMemoryTypeRangeCount; i++) {
-		const memory_type_range& range = sMemoryTypeRanges[i];
-		if (range.base > base) {
-			if (range.base - base < size && range.type != type) {
-				dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): Memory "
-					"range intersects with existing one (%#llx, %#llx, %lu).\n",
-					areaID, base, size, type, range.base, range.size,
-					range.type);
-				return B_BAD_VALUE;
-			}
-
-			// found the insertion index
-			if (!foundInsertionIndex) {
-				index = i;
-				foundInsertionIndex = true;
-			}
-			break;
-		} else if (base - range.base < range.size && range.type != type) {
-			dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): Memory "
-				"range intersects with existing one (%#llx, %#llx, %lu).\n",
-				areaID, base, size, type, range.base, range.size, range.type);
-			return B_BAD_VALUE;
-		}
-	}
-
-	if (!foundInsertionIndex)
-		index = sMemoryTypeRangeCount;
-
-	// make room for the new range
-	if (index < sMemoryTypeRangeCount) {
-		memmove(sMemoryTypeRanges + index + 1, sMemoryTypeRanges + index,
-			(sMemoryTypeRangeCount - index) * sizeof(memory_type_range));
-	}
-	sMemoryTypeRangeCount++;
-
-	memory_type_range& rangeInfo = sMemoryTypeRanges[index];
-	rangeInfo.base = base;
-	rangeInfo.size = size;
-	rangeInfo.type = type;
-	rangeInfo.area = areaID;
-
-	uint64 range = kMinMemoryTypeRangeSize;
-	status_t error;
-	do {
-		error = update_mttrs();
-		if (error == B_OK) {
-			if (rangeInfo.size != size) {
-				dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): "
-					"update_mtrrs() succeeded only with simplified range: "
-					"base: %#llx, size: %#llx\n", areaID, base, size, type,
-					rangeInfo.base, rangeInfo.size);
-			}
-			return B_OK;
-		}
-
-		// update_mttrs() failed -- try to simplify (i.e. shrink) the range
-		while (rangeInfo.size != 0) {
-			if ((rangeInfo.base & range) != 0) {
-				rangeInfo.base += range;
-				rangeInfo.size -= range;
-				// don't shift the range yet -- we might still have an
-				// unaligned size
-				break;
-			}
-
-			if ((rangeInfo.size & range) != 0) {
-				rangeInfo.size -= range;
-				range <<= 1;
-				break;
-			}
-
-			range <<= 1;
-		}
-	} while (rangeInfo.size > 0);
-
-	dprintf("add_memory_type_range(%ld, %#llx, %#llx, %lu): update_mtrrs() "
-		"failed.\n", areaID, base, size, type);
-	remove_memory_type_range_locked(index);
-	return error;
+	memory_type_range* range = areaID >= 0 ? find_range(areaID) : NULL;
+	int32 oldRangeType = -1;
+	if (range != NULL) {
+		if (range->base != base || range->size != size)
+			return B_BAD_VALUE;
+		if (range->type == type)
+			return B_OK;
+
+		oldRangeType = range->type;
+		range->type = type;
+	} else {
+		range = new(std::nothrow) memory_type_range;
+		if (range == NULL)
+			return B_NO_MEMORY;
+
+		range->area = areaID;
+		range->base = base;
+		range->size = size;
+		range->type = type;
+		sMemoryTypeRanges.Add(range);
+		sMemoryTypeRangeCount++;
+	}
+
+	status_t error = update_mtrrs();
+	if (error != B_OK) {
+		// revert the addition of the range/change of its type
+		if (oldRangeType < 0) {
+			sMemoryTypeRanges.Remove(range);
+			sMemoryTypeRangeCount--;
+			delete range;
+		} else
+			range->type = oldRangeType;
+
+		update_mtrrs();
+		return error;
+	}
+
+	return B_OK;
 }
@@ -529,18 +552,20 @@ remove_memory_type_range(area_id areaID)
 {
 	MutexLocker locker(sMemoryTypeLock);
 
-	for (uint32 i = 0; i < sMemoryTypeRangeCount; i++) {
-		if (sMemoryTypeRanges[i].area == areaID) {
-			TRACE_MTRR("remove_memory_type_range(%ld, %#llx, %#llxd)\n",
-				areaID, sMemoryTypeRanges[i].base, sMemoryTypeRanges[i].size);
-			remove_memory_type_range_locked(i);
-			update_mttrs();
-				// TODO: It's actually possible that this call fails, since
-				// compute_mtrrs() joins ranges and removing one might cause a
-				// previously joined big simple range to be split into several
-				// ranges (or just make it more complicated).
-			return;
-		}
+	memory_type_range* range = find_range(areaID);
+	if (range != NULL) {
+		TRACE_MTRR("remove_memory_type_range(%" B_PRId32 ", %#" B_PRIx64 ", %#"
+			B_PRIx64 ", %" B_PRIu32 ")\n", range->area, range->base,
+			range->size, range->type);
+
+		sMemoryTypeRanges.Remove(range);
+		sMemoryTypeRangeCount--;
+		delete range;
+
+		update_mtrrs();
+	} else {
+		dprintf("remove_memory_type_range(): no range known for area %" B_PRId32
+			"\n", areaID);
 	}
 }
@@ -569,8 +594,8 @@ arch_vm_init_post_area(kernel_args *args)
 	// map 0 - 0xa0000 directly
 	id = map_physical_memory("dma_region", (void *)0x0, 0xa0000,
-		B_ANY_KERNEL_ADDRESS, B_KERNEL_READ_AREA | B_KERNEL_WRITE_AREA,
-		&gDmaAddress);
+		B_ANY_KERNEL_ADDRESS | B_MTR_WB,
+		B_KERNEL_READ_AREA | B_KERNEL_WRITE_AREA, &gDmaAddress);
 	if (id < 0) {
 		panic("arch_vm_init_post_area: unable to map dma region\n");
 		return B_NO_MEMORY;


@@ -121,7 +121,8 @@ bios_init(void)
 {
 	// map BIOS area 0xe0000 - 0xfffff
 	area_id biosArea = map_physical_memory("pc bios", (void *)0xe0000, 0x20000,
-		B_ANY_KERNEL_ADDRESS, B_KERNEL_READ_AREA | B_KERNEL_WRITE_AREA, (void **)&gBiosBase);
+		B_ANY_KERNEL_ADDRESS | B_MTR_WB,
+		B_KERNEL_READ_AREA | B_KERNEL_WRITE_AREA, (void **)&gBiosBase);
 	if (biosArea < 0)
 		return biosArea;


@@ -1312,11 +1312,14 @@ vm_map_physical_memory(team_id team, const char* name, void** _address,
 	cache->Unlock();
 
-	if (status >= B_OK && (addressSpec & B_MTR_MASK) != 0) {
-		// set requested memory type
-		status = arch_vm_set_memory_type(area, physicalAddress,
-			addressSpec & B_MTR_MASK);
-		if (status < B_OK)
+	if (status == B_OK) {
+		// set requested memory type -- use uncached, if not given
+		uint32 memoryType = addressSpec & B_MTR_MASK;
+		if (memoryType == 0)
+			memoryType = B_MTR_UC;
+
+		status = arch_vm_set_memory_type(area, physicalAddress, memoryType);
+		if (status != B_OK)
 			delete_area(locker.AddressSpace(), area, false);
 	}