qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [Qemu-devel] [PATCH v3 42/43] tcg: introduce regions to split code_gen_buffer


From: Richard Henderson
Subject: Re: [Qemu-devel] [PATCH v3 42/43] tcg: introduce regions to split code_gen_buffer
Date: Thu, 20 Jul 2017 11:22:10 -1000
User-agent: Mozilla/5.0 (X11; Linux x86_64; rv:52.0) Gecko/20100101 Thunderbird/52.2.1

On 07/20/2017 10:50 AM, Emilio G. Cota wrote:
On Wed, Jul 19, 2017 at 22:04:50 -1000, Richard Henderson wrote:
On 07/19/2017 05:09 PM, Emilio G. Cota wrote:
+    /* We do not yet support multiple TCG contexts, so use one region for now */
+    n_regions = 1;
+
+    /* start on a page-aligned address */
+    buf = QEMU_ALIGN_PTR_UP(buf, qemu_real_host_page_size);
+    g_assert(buf < tcg_init_ctx.code_gen_buffer + size);
+
+    /* discard that initial portion */
+    size -= buf - tcg_init_ctx.code_gen_buffer;

It seems pointless wasting most of a page after the prologue when n_regions
== 1.  We don't really need to start on a page boundary in that case.

+    /* make region_size a multiple of page_size */
+    region_size = size / n_regions;
+    region_size = QEMU_ALIGN_DOWN(region_size, qemu_real_host_page_size);

This division can result in a number of pages at the end of the region being
unused.  Is it worthwhile freeing them?  Or marking them mprotect_none along
with the last guard page?

Perhaps we should then enlarge both the first and last regions so that we
fully use the buffer.

I really like the idea.  That's a lot of space recovered for 64k page hosts.

I do think we can make the computation clearer.  How about


  static void tcg_region_assign(TCGContext *s, size_t curr_region)
  {
+    void *aligned = QEMU_ALIGN_PTR_UP(region.start, qemu_real_host_page_size);
      void *buf;
+    size_t size = region.size;
- buf = region.buf + curr_region * (region.size + qemu_real_host_page_size);
+    /* The beginning of the first region might not be page-aligned */
+    if (curr_region == 0) {
+        buf = region.start;
+        size += aligned - buf;
+    } else {
+        buf = aligned + curr_region * (region.size + qemu_real_host_page_size);
+    }
+    /* the last region might be larger than region.size */
+    if (curr_region == region.n - 1) {
+        void *aligned_end = buf + size;
+
+        size += region.end - qemu_real_host_page_size - aligned_end;
+    }
      s->code_gen_buffer = buf;
      s->code_gen_ptr = buf;
-    s->code_gen_buffer_size = region.size;
-    s->code_gen_highwater = buf + region.size - TCG_HIGHWATER;
+    s->code_gen_buffer_size = size;
+    s->code_gen_highwater = buf + size - TCG_HIGHWATER;
  }

/*
 * Compute the [start, end) bounds of region number @curr_region within
 * the global code_gen_buffer described by the 'region' struct.
 *
 * Interior regions are region.size bytes apart plus one guard page.
 * The first region also absorbs the unaligned head of the buffer, and
 * the last region absorbs whatever pages were left over by rounding,
 * so those two may be larger than region.size.
 */
static inline void tcg_region_bounds(TCGContext *s, size_t curr_region,
                                     void **pstart, void **pend)
{
  /* Distance between the starts of consecutive regions: code + guard page.
     ??? Maybe store "stride" precomputed.  */
  size_t stride = region.size + qemu_real_host_page_size;
  /* First page-aligned address inside the buffer.
     ??? Maybe store "aligned" precomputed.  */
  void *aligned = QEMU_ALIGN_PTR_UP(region.start, qemu_real_host_page_size);

  void *start = aligned + curr_region * stride;
  void *end = start + region.size;

  if (curr_region == 0) {
    /* The first region begins at the (possibly unaligned) buffer start.  */
    start = region.start;
  }
  if (curr_region == region.n - 1) {
    /* The last region extends to the end of the buffer.  */
    end = region.end;
  }

  *pstart = start;
  *pend = end;
}

/*
 * Point TCG context @s at region number @curr_region of code_gen_buffer,
 * resetting its generation pointer and highwater mark accordingly.
 */
static void tcg_region_assign(TCGContext *s, size_t curr_region)
{
  void *buf_start, *buf_end;

  /* Look up where this region begins and ends within the buffer.  */
  tcg_region_bounds(s, curr_region, &buf_start, &buf_end);

  s->code_gen_buffer = buf_start;
  s->code_gen_ptr = buf_start;
  s->code_gen_buffer_size = buf_end - buf_start;
  /* Leave TCG_HIGHWATER bytes of slack before the region's end.  */
  s->code_gen_highwater = buf_end - TCG_HIGHWATER;
}

@@ -409,44 +424,50 @@ static size_t tcg_n_regions(void)
  void tcg_region_init(void)
  {
      void *buf = tcg_init_ctx.code_gen_buffer;
+    void *aligned;
      size_t size = tcg_init_ctx.code_gen_buffer_size;
+    size_t page_size = qemu_real_host_page_size;
      size_t region_size;
      size_t n_regions;
      size_t i;
+    int rc;
     n_regions = tcg_n_regions();

-    /* start on a page-aligned address */
-    buf = QEMU_ALIGN_PTR_UP(buf, qemu_real_host_page_size);
-    g_assert(buf < tcg_init_ctx.code_gen_buffer + size);
-
-    /* discard that initial portion */
-    size -= buf - tcg_init_ctx.code_gen_buffer;
-
-    /* make region_size a multiple of page_size */
-    region_size = size / n_regions;
-    region_size = QEMU_ALIGN_DOWN(region_size, qemu_real_host_page_size);
+    /* The first region will be 'aligned - buf' bytes larger than the others */
+    aligned = QEMU_ALIGN_PTR_UP(buf, page_size);
+    g_assert(aligned < tcg_init_ctx.code_gen_buffer + size);
+    /*
+     * Make region_size a multiple of page_size, using aligned as the start.
+     * As a result of this we might end up with a few extra pages at the end of
+     * the buffer; we will assign those to the last region.
+     */
+    region_size = (size - (aligned - buf)) / n_regions;
+    region_size = QEMU_ALIGN_DOWN(region_size, page_size);
/* A region must have at least 2 pages; one code, one guard */
-    g_assert(region_size >= 2 * qemu_real_host_page_size);
+    g_assert(region_size >= 2 * page_size);
/* init the region struct */
      qemu_mutex_init(&region.lock);
      region.n = n_regions;
-    region.buf = buf;
+    region.start = buf;
+    /* page-align the end, since its last page will be a guard page */
+    region.end = QEMU_ALIGN_PTR_DOWN(buf + size, page_size);
      /* do not count the guard page in region.size */
-    region.size = region_size - qemu_real_host_page_size;
+    region.size = region_size - page_size;
- /* set guard pages */
-    for (i = 0; i < region.n; i++) {
+    /* set guard pages for the first n-1 regions */
+    for (i = 0; i < region.n - 1; i++) {
          void *guard;
-        int rc;
- guard = region.buf + region.size;
-        guard += i * (region.size + qemu_real_host_page_size);
-        rc = qemu_mprotect_none(guard, qemu_real_host_page_size);
+        guard = aligned + region.size + i * (region.size + page_size);
+        rc = qemu_mprotect_none(guard, page_size);
          g_assert(!rc);
      }
+    /* the last region gets the rest of the buffer */
+    rc = qemu_mprotect_none(region.end - page_size, page_size);
+    g_assert(!rc);

  for (i = region.n; i-- > 0; ) {
    void *start, *end;
    tcg_region_bounds(s, i, &start, &end);
    rc = qemu_mprotect_none(end, page_size);
    g_assert(rc == 0);
  }



r~



reply via email to

[Prev in Thread] Current Thread [Next in Thread]