 e94f856b38
			
		
	
	
		e94f856b38
		
	
	
	
	
		
			
			This patch employs one solution to resolve two independent but related
issues.  Both issues are the result of one fundamental aspect of the
way VM's memory mapping works: VM uses its cache to map in blocks for
memory-mapped file regions, and for blocks already in the VM cache, VM
does not go to the file system before mapping them in.  To preserve
consistency between the FS and VM caches, VM relies on being informed
about all updates to file contents through the block cache.  The two
issues are both the result of VM not being properly informed about
such updates:
 1. Once a file system provides libminixfs with an inode association
    (inode number + inode offset) for a disk block, this association
    is not broken until a new inode association is provided for it.
    If a block is freed and reallocated as a metadata (non-inode)
    block, its old association is maintained, and may be supplied to
    VM's secondary cache.  Due to reuse of inodes, it is possible
    that the same inode association becomes valid for an actual file
    block again.  In that case, when that new file is memory-mapped,
    under certain circumstances, VM may end up using the metadata
    block to satisfy a page fault on the file, due to the stale inode
    association.  The result is a corrupted memory mapping, with the
    application seeing data other than the current file contents
    mapped in at the file block.
 2. When a hole is created in a file, the underlying block is freed
    from the device, but VM is not informed of this update, and thus,
    if VM's cache contains the block with its previous inode
    association, this block will remain there.  As a result, if an
    application subsequently memory-maps the file, VM will map in the
    old block at the position of the hole, rather than an all-zeroes
    block.  Thus, again, the result is a corrupted memory mapping.
This patch resolves both issues by making the file system inform the
minixfs library about blocks being freed, so that libminixfs can
break the inode association for that block, both in its own cache and
in the VM cache.  Since libminixfs does not know whether VM has the
block in its cache or not, it makes a call to VM for each block being
freed.  Thus, this change introduces more calls to VM, but it solves
the correctness issues at hand; optimizations may be introduced
later.  On the upside, all freed blocks are now marked as clean,
which should result in fewer blocks being written back to the device,
and the blocks are removed from the caches entirely, which should
result in slightly better cache usage.
This patch is necessary but not sufficient to resolve the situation
with respect to memory mapping of file holes in general.  Therefore,
this patch extends test 74 with a (rather particular but effective)
test for the first issue, but not yet with a test for the second one.
This fixes #90.
Change-Id: Iad8b134d2f88a884f15d3fc303e463280749c467
		
	
			
		
			
				
	
	
		
			89 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			89 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| 
 | |
| #include "syslib.h"
 | |
| 
 | |
| #include <string.h>
 | |
| #include <assert.h>
 | |
| 
 | |
| #include <sys/mman.h>
 | |
| 
 | |
| #include <minix/vm.h>
 | |
| #include <minix/sysutil.h>
 | |
| 
 | |
| #include <machine/param.h>
 | |
| #include <machine/vmparam.h>
 | |
| 
 | |
| static int vm_cachecall(message *m, int call, void *addr, dev_t dev,
 | |
| 	off_t dev_offset, ino_t ino, off_t ino_offset, u32_t *flags,
 | |
| 	int blocksize, int setflags)
 | |
| {
 | |
|     if(blocksize % PAGE_SIZE)
 | |
|     	panic("blocksize %d should be a multiple of pagesize %d\n",
 | |
| 		blocksize, PAGE_SIZE);
 | |
| 
 | |
|     if(ino_offset % PAGE_SIZE)
 | |
|     	panic("inode offset %lld should be a multiple of pagesize %d\n",
 | |
| 		ino_offset, PAGE_SIZE);
 | |
| 
 | |
|     if(dev_offset % PAGE_SIZE)
 | |
|     	panic("dev offset offset %lld should be a multiple of pagesize %d\n",
 | |
| 		dev_offset, PAGE_SIZE);
 | |
| 
 | |
|     memset(m, 0, sizeof(*m));
 | |
| 
 | |
|     assert(dev != NO_DEV);
 | |
| 
 | |
|     m->m_vmmcp.dev_offset = dev_offset;
 | |
|     m->m_vmmcp.ino_offset = ino_offset;
 | |
|     m->m_vmmcp.ino = ino;
 | |
|     m->m_vmmcp.block = addr;
 | |
|     m->m_vmmcp.flags_ptr = flags;
 | |
|     m->m_vmmcp.dev = dev;
 | |
|     m->m_vmmcp.pages = blocksize / PAGE_SIZE;
 | |
|     m->m_vmmcp.flags = setflags;
 | |
| 
 | |
|     return _taskcall(VM_PROC_NR, call, m);
 | |
| }
 | |
| 
 | |
| void *vm_map_cacheblock(dev_t dev, off_t dev_offset,
 | |
| 	ino_t ino, off_t ino_offset, u32_t *flags, int blocksize)
 | |
| {
 | |
| 	message m;
 | |
| 
 | |
| 	if(vm_cachecall(&m, VM_MAPCACHEPAGE, NULL, dev, dev_offset,
 | |
| 		ino, ino_offset, flags, blocksize, 0) != OK)
 | |
| 		return MAP_FAILED;
 | |
| 
 | |
| 	return m.m_vmmcp_reply.addr;
 | |
| }
 | |
| 
 | |
| int vm_set_cacheblock(void *block, dev_t dev, off_t dev_offset,
 | |
| 	ino_t ino, off_t ino_offset, u32_t *flags, int blocksize, int setflags)
 | |
| {
 | |
| 	message m;
 | |
| 
 | |
| 	return vm_cachecall(&m, VM_SETCACHEPAGE, block, dev, dev_offset,
 | |
| 		ino, ino_offset, flags, blocksize, setflags);
 | |
| }
 | |
| 
 | |
| int vm_forget_cacheblock(dev_t dev, off_t dev_offset, int blocksize)
 | |
| {
 | |
| 	message m;
 | |
| 
 | |
| 	return vm_cachecall(&m, VM_FORGETCACHEPAGE, NULL, dev, dev_offset,
 | |
| 		VMC_NO_INODE, 0, 0, blocksize, 0);
 | |
| }
 | |
| 
 | |
| int
 | |
| vm_clear_cache(dev_t dev)
 | |
| {
 | |
| 	message m;
 | |
| 
 | |
| 	assert(dev != NO_DEV);
 | |
| 
 | |
| 	memset(&m, 0, sizeof(m));
 | |
| 
 | |
| 	m.m_vmmcp.dev = dev;
 | |
| 
 | |
| 	return _taskcall(VM_PROC_NR, VM_CLEARCACHE, &m);
 | |
| }
 |