from __future__ import print_function from .lib import TestBase, FileCreator from smmap.mman import ( WindowCursor, SlidingWindowMapManager, StaticWindowMapManager ) from smmap.util import align_to_mmap from random import randint from time import time import os import sys from copy import copy class TestMMan(TestBase): def test_cursor(self): with FileCreator(self.k_window_test_size, "cursor_test") as fc: man = SlidingWindowMapManager() ci = WindowCursor(man) # invalid cursor assert not ci.is_valid() assert not ci.is_associated() assert ci.size() == 0 # this is cached, so we can query it in invalid state cv = man.make_cursor(fc.path) assert not cv.is_valid() # no region mapped yet assert cv.is_associated() # but it know where to map it from assert cv.file_size() == fc.size assert cv.path() == fc.path # copy module cio = copy(cv) assert not cio.is_valid() and cio.is_associated() # assign method assert not ci.is_associated() ci.assign(cv) assert not ci.is_valid() and ci.is_associated() # unuse non-existing region is fine cv.unuse_region() cv.unuse_region() # destruction is fine (even multiple times) cv._destroy() WindowCursor(man)._destroy() def test_memory_manager(self): slide_man = SlidingWindowMapManager() static_man = StaticWindowMapManager() for man in (static_man, slide_man): assert man.num_file_handles() == 0 assert man.num_open_files() == 0 winsize_cmp_val = 0 if isinstance(man, StaticWindowMapManager): winsize_cmp_val = -1 # END handle window size assert man.window_size() > winsize_cmp_val assert man.mapped_memory_size() == 0 assert man.max_mapped_memory_size() > 0 # collection doesn't raise in 'any' mode man._collect_lru_region(0) # doesn't raise if we are within the limit man._collect_lru_region(10) # doesn't fail if we over-allocate assert man._collect_lru_region(sys.maxsize) == 0 # use a region, verify most basic functionality with FileCreator(self.k_window_test_size, "manager_test") as fc: fd = os.open(fc.path, os.O_RDONLY) try: for item in (fc.path, fd): c = man.make_cursor(item) assert c.path_or_fd() is item assert c.use_region(10, 10).is_valid() assert c.ofs_begin() == 10 assert c.size() == 10 with open(fc.path, 'rb') as fp: assert c.buffer()[:] == fp.read(20)[10:] if isinstance(item, int): self.assertRaises(ValueError, c.path) else: self.assertRaises(ValueError, c.fd) # END handle value error # END for each input finally: os.close(fd) # END for each manasger type def test_memman_operation(self): # test more access, force it to actually unmap regions with FileCreator(self.k_window_test_size, "manager_operation_test") as fc: with open(fc.path, 'rb') as fp: data = fp.read() fd = os.open(fc.path, os.O_RDONLY) try: max_num_handles = 15 # small_size = for mtype, args in ((StaticWindowMapManager, (0, fc.size // 3, max_num_handles)), (SlidingWindowMapManager, (fc.size // 100, fc.size // 3, max_num_handles)),): for item in (fc.path, fd): assert len(data) == fc.size # small windows, a reasonable max memory. Not too many regions at once man = mtype(window_size=args[0], max_memory_size=args[1], max_open_handles=args[2]) c = man.make_cursor(item) # still empty (more about that is tested in test_memory_manager() assert man.num_open_files() == 0 assert man.mapped_memory_size() == 0 base_offset = 5000 # window size is 0 for static managers, hence size will be 0. We take that into consideration size = man.window_size() // 2 assert c.use_region(base_offset, size).is_valid() rr = c.region() assert rr.client_count() == 2 # the manager and the cursor and us assert man.num_open_files() == 1 assert man.num_file_handles() == 1 assert man.mapped_memory_size() == rr.size() # assert c.size() == size # the cursor may overallocate in its static version assert c.ofs_begin() == base_offset assert rr.ofs_begin() == 0 # it was aligned and expanded if man.window_size(): # but isn't larger than the max window (aligned) assert rr.size() == align_to_mmap(man.window_size(), True) else: assert rr.size() == fc.size # END ignore static managers which dont use windows and are aligned to file boundaries assert c.buffer()[:] == data[base_offset:base_offset + (size or c.size())] # obtain second window, which spans the first part of the file - it is a still the same window nsize = (size or fc.size) - 10 assert c.use_region(0, nsize).is_valid() assert c.region() == rr assert man.num_file_handles() == 1 assert c.size() == nsize assert c.ofs_begin() == 0 assert c.buffer()[:] == data[:nsize] # map some part at the end, our requested size cannot be kept overshoot = 4000 base_offset = fc.size - (size or c.size()) + overshoot assert c.use_region(base_offset, size).is_valid() if man.window_size(): assert man.num_file_handles() == 2 assert c.size() < size assert c.region() is not rr # old region is still available, but has not curser ref anymore assert rr.client_count() == 1 # only held by manager else: assert c.size() < fc.size # END ignore static managers which only have one handle per file rr = c.region() assert rr.client_count() == 2 # manager + cursor assert rr.ofs_begin() < c.ofs_begin() # it should have extended itself to the left assert rr.ofs_end() <= fc.size # it cannot be larger than the file assert c.buffer()[:] == data[base_offset:base_offset + (size or c.size())] # unising a region makes the cursor invalid c.unuse_region() assert not c.is_valid() if man.window_size(): # but doesn't change anything regarding the handle count - we cache it and only # remove mapped regions if we have to assert man.num_file_handles() == 2 # END ignore this for static managers # iterate through the windows, verify data contents # this will trigger map collection after a while max_random_accesses = 5000 num_random_accesses = max_random_accesses memory_read = 0 st = time() # cache everything to get some more performance includes_ofs = c.includes_ofs max_mapped_memory_size = man.max_mapped_memory_size() max_file_handles = man.max_file_handles() mapped_memory_size = man.mapped_memory_size num_file_handles = man.num_file_handles while num_random_accesses: num_random_accesses -= 1 base_offset = randint(0, fc.size - 1) # precondition if man.window_size(): assert max_mapped_memory_size >= mapped_memory_size() # END statics will overshoot, which is fine assert max_file_handles >= num_file_handles() assert c.use_region(base_offset, (size or c.size())).is_valid() csize = c.size() assert c.buffer()[:] == data[base_offset:base_offset + csize] memory_read += csize assert includes_ofs(base_offset) assert includes_ofs(base_offset + csize - 1) assert not includes_ofs(base_offset + csize) # END while we should do an access elapsed = max(time() - st, 0.001) # prevent zero divison errors on windows mb = float(1000 * 1000) print("%s: Read %i mb of memory with %i random on cursor initialized with %s accesses in %fs (%f mb/s)\n" % (mtype, memory_read / mb, max_random_accesses, type(item), elapsed, (memory_read / mb) / elapsed), file=sys.stderr) # an offset as large as the size doesn't work ! assert not c.use_region(fc.size, size).is_valid() # collection - it should be able to collect all assert man.num_file_handles() assert man.collect() assert man.num_file_handles() == 0 # END for each item # END for each manager type finally: os.close(fd)