Coverage Report

Created: 2020-11-21 08:34

/src/botan/src/lib/utils/mem_pool/mem_pool.cpp
 Count | Source
       | /*
       | * (C) 2018,2019 Jack Lloyd
       | *
       | * Botan is released under the Simplified BSD License (see license.txt)
       | */
       |
       | #include <botan/internal/mem_pool.h>
       | #include <botan/mem_ops.h>
       | #include <algorithm>
       |
       | #if defined(BOTAN_MEM_POOL_USE_MMU_PROTECTIONS)
       |    #include <botan/internal/os_utils.h>
       | #endif
       |
       | namespace Botan {
       |
       | /*
       | * Memory pool theory of operation
       | *
       | * This allocator is not useful as a general purpose allocator, but works well
       | * within the context of allocating cryptographic keys. It makes several
       | * assumptions which don't work for implementing malloc but simplify and speed
       | * up the implementation:
       | *
       | * - There is some set of pages, which cannot be expanded later. These are pages
       | *   which were allocated, mlocked and passed to the Memory_Pool constructor.
       | *
       | * - The allocator is allowed to return null anytime it feels like not servicing
       | *   a request, in which case the request will be sent to calloc instead. In
       | *   particular, requests which are too small or too large are rejected.
       | *
       | * - Most allocations are powers of 2, the remainder are usually a multiple of 8.
       | *
       | * - Free requests include the size of the allocation, so there is no need to
       | *   track this within the pool.
       | *
       | * - Alignment is important to the caller. For this allocator, any allocation of
       | *   size N is aligned evenly at N bytes.
       | *
       | * Initially each page is in the free page list. Each page is used for just one
       | * size of allocation, with requests bucketed into a small number of common
       | * sizes. If the allocation would be too big or too small it is rejected by the pool.
       | *
       | * The free list is maintained by a bitmap, one per page/Bucket. Since each
       | * Bucket only maintains objects of a single size, each bit set or clear
       | * indicates the status of one object.
       | *
       | * An allocation walks the list of buckets and asks each in turn if there is
       | * space. If a Bucket does not have any space, it sets a boolean flag m_is_full
       | * so that it does not need to rescan when asked again. The flag is cleared on
       | * the first free from that bucket. If no bucket has space, but there are some
       | * free pages left, a free page is claimed as a new Bucket for that size. In
       | * this case it is pushed to the front of the list so it is first in line to
       | * service new requests.
       | *
       | * A deallocation also walks the list of buckets for the size and asks each
       | * Bucket in turn if it recognizes the pointer. When a Bucket becomes empty as a
       | * result of a deallocation, it is recycled back into the free pool. When this
       | * happens, the Bucket's page goes to the end of the free list. All pages on the
       | * free list are marked in the MMU as noaccess, so anything touching them will
       | * immediately crash. They are only marked R/W once placed into a new bucket.
       | * Making the free list FIFO maximizes the time between the last free of a
       | * bucket and that page becoming writable again, maximizing the chance of
       | * crashing after a use-after-free.
       | *
       | * Future work
       | * -----------
       | *
       | * The allocator is protected by a global lock. It would be good to break this
       | * up, since almost all of the work can actually be done in parallel, especially
       | * when allocating objects of different sizes (which can't possibly share a
       | * bucket).
       | *
       | * It may be worthwhile to optimize deallocation by storing the Buckets in order
       | * (by pointer value), which would allow a binary search to find the owning bucket.
       | *
       | * A useful addition would be to randomize the allocations. Memory_Pool would be
       | * changed to also receive a RandomNumberGenerator& object (presumably the system
       | * RNG, or maybe a ChaCha_RNG seeded with the system RNG). Then the bucket to use
       | * and the offset within the bucket would be chosen randomly, instead of using
       | * first fit.
       | *
       | * Right now we don't make any provision for threading, so if two threads both
       | * allocate 32 byte values one after the other, the two allocations will likely
       | * share a cache line. Ensuring that distinct threads will (tend to) use distinct
       | * buckets would reduce this.
       | *
       | * Supporting a realloc-style API may be useful.
       | */
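       |
       | /*
       | * Illustration only, not part of the original file: a minimal sketch of the
       | * calling pattern described above, assuming the caller falls back to the
       | * system allocator whenever the pool declines a request. The helper names
       | * pool_backed_alloc and pool_backed_free are hypothetical.
       | *
       | *   void* pool_backed_alloc(Memory_Pool& pool, size_t n)
       | *      {
       | *      if(void* p = pool.allocate(n))
       | *         return p;               // served from a bucket, aligned to the bucket size
       | *      return std::calloc(n, 1);  // rejected: too small, too large, or out of pages
       | *      }
       | *
       | *   void pool_backed_free(Memory_Pool& pool, void* p, size_t n)
       | *      {
       | *      if(!pool.deallocate(p, n)) // pool zeroes the block and may recycle its page
       | *         std::free(p);           // never owned by the pool, so it came from calloc
       | *      }
       | */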
       |
       | namespace {
       |
       | size_t choose_bucket(size_t n)
  244k |    {
  244k |    const size_t MINIMUM_ALLOCATION = 16;
  244k |    const size_t MAXIMUM_ALLOCATION = 256;
       |
  244k |    if(n < MINIMUM_ALLOCATION || n > MAXIMUM_ALLOCATION)
 1.07k |       return 0;
       |
       |    // Need to tune these
       |
  243k |    const size_t buckets[] = {
  243k |       16, 24, 32, 48, 64, 80, 96, 112, 128, 160, 192, 256, 0,
  243k |    };
       |
  857k |    for(size_t i = 0; buckets[i]; ++i)
  857k |       {
  857k |       if(n <= buckets[i])
  243k |          {
  243k |          return buckets[i];
  243k |          }
  857k |       }
       |
     0 |    return 0;
  243k |    }
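       |
       | // Illustration only, not part of the original file: choose_bucket() rounds a
       | // request up to the nearest bucket size, or returns 0 to reject it, e.g.
       | //
       | //    choose_bucket(20)  == 24    (rounded up to the 24 byte bucket)
       | //    choose_bucket(64)  == 64    (exact fit)
       | //    choose_bucket(200) == 256   (rounded up to the largest bucket)
       | //    choose_bucket(8)   == 0     (below MINIMUM_ALLOCATION, rejected)
       | //    choose_bucket(300) == 0     (above MAXIMUM_ALLOCATION, rejected)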
       |
       | inline bool ptr_in_pool(const void* pool_ptr, size_t poolsize,
       |                         const void* buf_ptr, size_t bufsize)
  103k |    {
  103k |    const uintptr_t pool = reinterpret_cast<uintptr_t>(pool_ptr);
  103k |    const uintptr_t buf = reinterpret_cast<uintptr_t>(buf_ptr);
  103k |    return (buf >= pool) && (buf + bufsize <= pool + poolsize);
  103k |    }
       |
       | // return index of the lowest set bit
       | template<typename T>
       | size_t find_set_bit(T b)
  128k |    {
  128k |    size_t s = 8*sizeof(T) / 2;
  128k |    size_t bit = 0;
       |
       |    // In this context we don't need to be const-time
  897k |    while(s > 0)
  769k |       {
  769k |       const T mask = (static_cast<T>(1) << s) - 1;
  769k |       if((b & mask) == 0)
  116k |          {
  116k |          bit += s;
  116k |          b >>= s;
  116k |          }
  769k |       s /= 2;
  769k |       }
       |
  128k |    return bit;
  128k |    }
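       |
       | // Illustration only, not part of the original file: a worked trace of the
       | // binary search above, for T = uint8_t and b = 0x10 (only bit 4 set):
       | //
       | //    s=4: low nibble of b is zero   -> bit = 4, b >>= 4 leaves b = 0x01
       | //    s=2: low two bits are nonzero  -> no change
       | //    s=1: low bit is nonzero        -> no change
       | //    returns 4, the index of the lowest set bit (assumes some bit of b is set)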
       |
       | class BitMap final
       |    {
       |    public:
       |       BitMap(size_t bits) : m_len(bits)
 70.8k |          {
 70.8k |          m_bits.resize((bits + BITMASK_BITS - 1) / BITMASK_BITS);
 70.8k |          m_main_mask = static_cast<bitmask_type>(~0);
 70.8k |          m_last_mask = m_main_mask;
       |
 70.8k |          if(bits % BITMASK_BITS != 0)
 17.4k |             m_last_mask = (static_cast<bitmask_type>(1) << (bits % BITMASK_BITS)) - 1;
 70.8k |          }
       |
       |       bool find_free(size_t* bit);
       |
       |       void free(size_t bit)
 99.1k |          {
 99.1k |          BOTAN_ASSERT_NOMSG(bit <= m_len);
 99.1k |          const size_t w = bit / BITMASK_BITS;
 99.1k |          BOTAN_ASSERT_NOMSG(w < m_bits.size());
 99.1k |          const bitmask_type mask = static_cast<bitmask_type>(1) << (bit % BITMASK_BITS);
 99.1k |          m_bits[w] = m_bits[w] & (~mask);
 99.1k |          }
       |
       |       bool empty() const
 99.1k |          {
  320k |          for(size_t i = 0; i != m_bits.size(); ++i)
  252k |             {
  252k |             if(m_bits[i] != 0)
 30.8k |                {
 30.8k |                return false;
 30.8k |                }
  252k |             }
       |
 68.2k |          return true;
 99.1k |          }
       |
       |    private:
       | #if defined(BOTAN_ENABLE_DEBUG_ASSERTS)
       |       typedef uint8_t bitmask_type;
       |       enum { BITMASK_BITS = 8 };
       | #else
       |       typedef word bitmask_type;
       |       enum { BITMASK_BITS = BOTAN_MP_WORD_BITS };
       | #endif
       |
       |       size_t m_len;
       |       bitmask_type m_main_mask;
       |       bitmask_type m_last_mask;
       |       std::vector<bitmask_type> m_bits;
       |    };
       |
       | bool BitMap::find_free(size_t* bit)
  128k |    {
  144k |    for(size_t i = 0; i != m_bits.size(); ++i)
  143k |       {
  101k |       const bitmask_type mask = (i == m_bits.size() - 1) ? m_last_mask : m_main_mask;
  143k |       if((m_bits[i] & mask) != mask)
  128k |          {
  128k |          size_t free_bit = find_set_bit(~m_bits[i]);
  128k |          const bitmask_type bmask = static_cast<bitmask_type>(1) << (free_bit % BITMASK_BITS);
  128k |          BOTAN_ASSERT_NOMSG((m_bits[i] & bmask) == 0);
  128k |          m_bits[i] |= bmask;
  128k |          *bit = BITMASK_BITS*i + free_bit;
  128k |          return true;
  128k |          }
  143k |       }
       |
   458 |    return false;
  128k |    }
       |
       | }
       |
       | class Bucket final
       |    {
       |    public:
       |       Bucket(uint8_t* mem, size_t mem_size, size_t item_size) :
       |          m_item_size(item_size),
       |          m_page_size(mem_size),
       |          m_range(mem),
       |          m_bitmap(mem_size / item_size),
       |          m_is_full(false)
 70.8k |          {
 70.8k |          }
       |
       |       uint8_t* alloc()
  143k |          {
  143k |          if(m_is_full)
 14.5k |             {
       |             // I know I am full
 14.5k |             return nullptr;
 14.5k |             }
       |
  128k |          size_t offset;
  128k |          if(!m_bitmap.find_free(&offset))
   458 |             {
       |             // I just found out I am full
   458 |             m_is_full = true;
   458 |             return nullptr;
   458 |             }
       |
  128k |          BOTAN_ASSERT(offset * m_item_size < m_page_size, "Offset is in range");
  128k |          return m_range + m_item_size*offset;
  128k |          }
       |
       |       bool free(void* p)
  103k |          {
  103k |          if(!in_this_bucket(p))
 4.09k |             return false;
       |
       |          /*
       |          Zero also any trailing bytes, which should not have been written to,
       |          but maybe the user was bad and wrote past the end.
       |          */
 99.1k |          std::memset(p, 0, m_item_size);
       |
 99.1k |          const size_t offset = (reinterpret_cast<uintptr_t>(p) - reinterpret_cast<uintptr_t>(m_range)) / m_item_size;
       |
 99.1k |          m_bitmap.free(offset);
 99.1k |          m_is_full = false;
       |
 99.1k |          return true;
 99.1k |          }
       |
       |       bool in_this_bucket(void* p) const
  103k |          {
  103k |          return ptr_in_pool(m_range, m_page_size, p, m_item_size);
  103k |          }
       |
       |       bool empty() const
 99.1k |          {
 99.1k |          return m_bitmap.empty();
 99.1k |          }
       |
       |       uint8_t* ptr() const
 68.2k |          {
 68.2k |          return m_range;
 68.2k |          }
       |
       |    private:
       |       size_t m_item_size;
       |       size_t m_page_size;
       |       uint8_t* m_range;
       |       BitMap m_bitmap;
       |       bool m_is_full;
       |    };
       |
       | Memory_Pool::Memory_Pool(const std::vector<void*>& pages, size_t page_size) :
       |    m_page_size(page_size)
 1.27k |    {
 1.27k |    m_min_page_ptr = ~static_cast<uintptr_t>(0);
 1.27k |    m_max_page_ptr = 0;
       |
 6.39k |    for(size_t i = 0; i != pages.size(); ++i)
 5.11k |       {
 5.11k |       const uintptr_t p = reinterpret_cast<uintptr_t>(pages[i]);
       |
 5.11k |       m_min_page_ptr = std::min(p, m_min_page_ptr);
 5.11k |       m_max_page_ptr = std::max(p, m_max_page_ptr);
       |
 5.11k |       clear_bytes(pages[i], m_page_size);
       | #if defined(BOTAN_MEM_POOL_USE_MMU_PROTECTIONS)
       |       OS::page_prohibit_access(pages[i]);
       | #endif
 5.11k |       m_free_pages.push_back(static_cast<uint8_t*>(pages[i]));
 5.11k |       }
       |
       |    /*
       |    Right now this points to the start of the last page, adjust it to instead
       |    point to the first byte of the following page
       |    */
 1.27k |    m_max_page_ptr += page_size;
 1.27k |    }
       |
       | Memory_Pool::~Memory_Pool()
 1.27k |    {
       | #if defined(BOTAN_MEM_POOL_USE_MMU_PROTECTIONS)
       |    for(size_t i = 0; i != m_free_pages.size(); ++i)
       |       {
       |       OS::page_allow_access(m_free_pages[i]);
       |       }
       | #endif
 1.27k |    }
       |
       | void* Memory_Pool::allocate(size_t n)
  145k |    {
  145k |    if(n > m_page_size)
     0 |       return nullptr;
       |
  145k |    const size_t n_bucket = choose_bucket(n);
       |
  145k |    if(n_bucket > 0)
  144k |       {
  144k |       lock_guard_type<mutex_type> lock(m_mutex);
       |
  144k |       std::deque<Bucket>& buckets = m_buckets_for[n_bucket];
       |
       |       /*
       |       It would be optimal to pick the bucket with the most usage,
       |       since a bucket with say 1 item allocated out of it has a high
       |       chance of becoming later freed and then the whole page can be
       |       recycled.
       |       */
  144k |       for(auto& bucket : buckets)
 72.3k |          {
 72.3k |          if(uint8_t* p = bucket.alloc())
 57.3k |             return p;
       |
       |          // If the bucket is full, maybe move it to the end of the list?
       |          // Otoh bucket search should be very fast
 72.3k |          }
       |
 87.1k |       if(m_free_pages.size() > 0)
 70.8k |          {
 70.8k |          uint8_t* ptr = m_free_pages[0];
 70.8k |          m_free_pages.pop_front();
       | #if defined(BOTAN_MEM_POOL_USE_MMU_PROTECTIONS)
       |          OS::page_allow_access(ptr);
       | #endif
 70.8k |          buckets.push_front(Bucket(ptr, m_page_size, n_bucket));
 70.8k |          void* p = buckets[0].alloc();
 70.8k |          BOTAN_ASSERT_NOMSG(p != nullptr);
 70.8k |          return p;
 70.8k |          }
 17.3k |       }
       |
       |    // out of room
 17.3k |    return nullptr;
 17.3k |    }
       |
       | bool Memory_Pool::deallocate(void* p, size_t len) noexcept
 99.1k |    {
       |    // Do a fast range check first, before taking the lock
 99.1k |    const uintptr_t p_val = reinterpret_cast<uintptr_t>(p);
 99.1k |    if(p_val < m_min_page_ptr || p_val > m_max_page_ptr)
     0 |       return false;
       |
 99.1k |    const size_t n_bucket = choose_bucket(len);
       |
 99.1k |    if(n_bucket != 0)
 99.1k |       {
 99.1k |       try
 99.1k |          {
 99.1k |          lock_guard_type<mutex_type> lock(m_mutex);
       |
 99.1k |          std::deque<Bucket>& buckets = m_buckets_for[n_bucket];
       |
  103k |          for(size_t i = 0; i != buckets.size(); ++i)
  103k |             {
  103k |             Bucket& bucket = buckets[i];
  103k |             if(bucket.free(p))
 99.1k |                {
 99.1k |                if(bucket.empty())
 68.2k |                   {
       | #if defined(BOTAN_MEM_POOL_USE_MMU_PROTECTIONS)
       |                   OS::page_prohibit_access(bucket.ptr());
       | #endif
 68.2k |                   m_free_pages.push_back(bucket.ptr());
       |
 68.2k |                   if(i != buckets.size() - 1)
 1.16k |                      std::swap(buckets.back(), buckets[i]);
 68.2k |                   buckets.pop_back();
 68.2k |                   }
 99.1k |                return true;
 99.1k |                }
  103k |             }
 99.1k |          }
 99.1k |       catch(...)
     0 |          {
       |          /*
       |          * The only exception throws that can occur in the above code are from
       |          * either the STL or BOTAN_ASSERT failures. In either case, such an
       |          * error indicates a logic error or data corruption in the memory
       |          * allocator such that it is no longer safe to continue executing.
       |          *
       |          * Since this function is noexcept, simply letting the exception escape
       |          * is sufficient for terminate to be called. However in this scenario
       |          * it is implementation defined if any stack unwinding is performed.
       |          * Since stack unwinding could cause further memory deallocations this
       |          * could result in further corruption in this allocator state. To prevent
       |          * this, call terminate directly.
       |          */
     0 |          std::terminate();
     0 |          }
 99.1k |       }
       |
     0 |    return false;
 99.1k |    }
       |
       | }