Use a functional red-black tree for indexing the shapes
This is an experimental commit that uses a functional red-black tree to create an index of the ancestor shapes. It uses an Okasaki style functional red black tree: https://www.cs.tufts.edu/comp/150FP/archive/chris-okasaki/redblack99.pdf This tree is advantageous because: * It offers O(n log n) insertions and O(n log n) lookups. * It shares memory with previous "versions" of the tree When we insert a node in the tree, only the parts of the tree that need to be rebalanced are newly allocated. Parts of the tree that don't need to be rebalanced are not reallocated, so "new trees" are able to share memory with old trees. This is in contrast to a sorted set where we would have to duplicate the set, and also resort the set on each insertion. I've added a new stat to RubyVM.stat so we can understand how the red black tree increases.
This commit is contained in:
parent
5c4978c11c
commit
84e4453436
20
benchmark/vm_ivar_ic_miss.yml
Normal file
20
benchmark/vm_ivar_ic_miss.yml
Normal file
@ -0,0 +1,20 @@
|
||||
prelude: |
|
||||
class Foo
|
||||
def initialize diverge
|
||||
if diverge
|
||||
@a = 1
|
||||
end
|
||||
|
||||
@a0 = @a1 = @a2 = @a3 = @a4 = @a5 = @a6 = @a7 = @a8 = @a9 = @a10 = @a11 = @a12 = @a13 = @a14 = @a15 = @a16 = @a17 = @a18 = @a19 = @a20 = @a21 = @a22 = @a23 = @a24 = @a25 = @a26 = @a27 = @a28 = @a29 = @a30 = @a31 = @a32 = @a33 = @a34 = @a35 = @a36 = @a37 = @a38 = @a39 = @a40 = @a41 = @a42 = @a43 = @a44 = @a45 = @a46 = @a47 = @a48 = @a49 = @a50 = @a51 = @a52 = @a53 = @a54 = @a55 = @a56 = @a57 = @a58 = @a59 = @a60 = @a61 = @a62 = @a63 = @a64 = @a65 = @a66 = @a67 = @a68 = @a69 = @a70 = @a71 = @a72 = @a73 = @a74 = @b = 1
|
||||
end
|
||||
|
||||
def b; @b; end
|
||||
end
|
||||
|
||||
a = Foo.new false
|
||||
b = Foo.new true
|
||||
benchmark:
|
||||
vm_ivar_ic_miss: |
|
||||
a.b
|
||||
b.b
|
||||
loop_count: 30000000
|
@ -1483,6 +1483,7 @@ module RubyVM::RJIT # :nodoc: all
|
||||
type: [CType::Immediate.parse("uint8_t"), Primitive.cexpr!("OFFSETOF((*((struct rb_shape *)NULL)), type)")],
|
||||
size_pool_index: [CType::Immediate.parse("uint8_t"), Primitive.cexpr!("OFFSETOF((*((struct rb_shape *)NULL)), size_pool_index)")],
|
||||
parent_id: [self.shape_id_t, Primitive.cexpr!("OFFSETOF((*((struct rb_shape *)NULL)), parent_id)")],
|
||||
ancestor_index: [CType::Pointer.new { self.redblack_node_t }, Primitive.cexpr!("OFFSETOF((*((struct rb_shape *)NULL)), ancestor_index)")],
|
||||
)
|
||||
end
|
||||
|
||||
@ -1641,6 +1642,10 @@ module RubyVM::RJIT # :nodoc: all
|
||||
CType::Bool.new
|
||||
end
|
||||
|
||||
def C.redblack_node_t
|
||||
CType::Stub.new(:redblack_node_t)
|
||||
end
|
||||
|
||||
def C.ccan_list_node
|
||||
CType::Stub.new(:ccan_list_node)
|
||||
end
|
||||
|
309
shape.c
309
shape.c
@ -11,6 +11,10 @@
|
||||
#include "variable.h"
|
||||
#include <stdbool.h>
|
||||
|
||||
#ifndef _WIN32
|
||||
#include <sys/mman.h>
|
||||
#endif
|
||||
|
||||
#ifndef SHAPE_DEBUG
|
||||
#define SHAPE_DEBUG (VM_CHECK_MODE > 0)
|
||||
#endif
|
||||
@ -20,11 +24,235 @@
|
||||
#define SINGLE_CHILD_MASK (~((uintptr_t)SINGLE_CHILD_TAG))
|
||||
#define SINGLE_CHILD_P(x) (((uintptr_t)x) & SINGLE_CHILD_TAG)
|
||||
#define SINGLE_CHILD(x) (rb_shape_t *)((uintptr_t)x & SINGLE_CHILD_MASK)
|
||||
#define ANCESTOR_CACHE_THRESHOLD 10
|
||||
|
||||
static ID id_frozen;
|
||||
static ID id_t_object;
|
||||
static ID size_pool_edge_names[SIZE_POOL_COUNT];
|
||||
|
||||
#define LEAF 0
|
||||
#define BLACK 0x0
|
||||
#define RED 0x1
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_left(redblack_node_t * node)
|
||||
{
|
||||
if (node->l == LEAF) {
|
||||
return LEAF;
|
||||
}
|
||||
else {
|
||||
RUBY_ASSERT(node->l < GET_SHAPE_TREE()->cache_size);
|
||||
redblack_node_t * left = &GET_SHAPE_TREE()->shape_cache[node->l - 1];
|
||||
return left;
|
||||
}
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_right(redblack_node_t * node)
|
||||
{
|
||||
if (node->r == LEAF) {
|
||||
return LEAF;
|
||||
}
|
||||
else {
|
||||
RUBY_ASSERT(node->r < GET_SHAPE_TREE()->cache_size);
|
||||
redblack_node_t * right = &GET_SHAPE_TREE()->shape_cache[node->r - 1];
|
||||
return right;
|
||||
}
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_find(redblack_node_t * tree, ID key)
|
||||
{
|
||||
if (tree != LEAF) {
|
||||
if (tree->key == key) {
|
||||
return tree;
|
||||
}
|
||||
else {
|
||||
if (key < tree->key) {
|
||||
return redblack_find(redblack_left(tree), key);
|
||||
}
|
||||
else {
|
||||
return redblack_find(redblack_right(tree), key);
|
||||
}
|
||||
}
|
||||
}
|
||||
else {
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
|
||||
static inline char
|
||||
redblack_color(redblack_node_t * node)
|
||||
{
|
||||
return node && ((uintptr_t)node->value & RED);
|
||||
}
|
||||
|
||||
static inline bool
|
||||
redblack_red_p(redblack_node_t * node)
|
||||
{
|
||||
return redblack_color(node) == RED;
|
||||
}
|
||||
|
||||
static inline rb_shape_t *
|
||||
redblack_value(redblack_node_t * node)
|
||||
{
|
||||
// Color is stored in the bottom bit of the shape pointer
|
||||
// Mask away the bit so we get the actual pointer back
|
||||
return (rb_shape_t *)((uintptr_t)node->value & (((uintptr_t)-1) - 1));
|
||||
}
|
||||
|
||||
static redblack_id_t
|
||||
redblack_id_for(redblack_node_t * node)
|
||||
{
|
||||
RUBY_ASSERT(node || node == LEAF);
|
||||
if (node == LEAF) {
|
||||
return 0;
|
||||
}
|
||||
else {
|
||||
redblack_node_t * redblack_nodes = GET_SHAPE_TREE()->shape_cache;
|
||||
redblack_id_t id = (redblack_id_t)(node - redblack_nodes);
|
||||
return id + 1;
|
||||
}
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_new(char color, ID key, rb_shape_t * value, redblack_node_t * left, redblack_node_t * right)
|
||||
{
|
||||
redblack_node_t * redblack_nodes = GET_SHAPE_TREE()->shape_cache;
|
||||
redblack_node_t * node = &redblack_nodes[(GET_SHAPE_TREE()->cache_size)++];
|
||||
node->key = key;
|
||||
node->value = (rb_shape_t *)((uintptr_t)value | color);
|
||||
node->l = redblack_id_for(left);
|
||||
node->r = redblack_id_for(right);
|
||||
return node;
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_balance(char color, ID key, rb_shape_t * value, redblack_node_t * left, redblack_node_t * right)
|
||||
{
|
||||
if (color == BLACK) {
|
||||
ID z, y, x;
|
||||
rb_shape_t * z_, * y_, * x_;
|
||||
redblack_node_t * a, * b, * c, * d;
|
||||
|
||||
if (redblack_red_p(left) && redblack_red_p(redblack_left(left))) {
|
||||
z = key;
|
||||
z_ = value;
|
||||
d = right;
|
||||
|
||||
y = left->key;
|
||||
y_ = redblack_value(left);
|
||||
c = redblack_right(left);
|
||||
|
||||
x = redblack_left(left)->key;
|
||||
x_ = redblack_value(redblack_left(left));
|
||||
|
||||
a = redblack_left(redblack_left(left));
|
||||
b = redblack_right(redblack_left(left));
|
||||
}
|
||||
else if (redblack_red_p(left) && redblack_red_p(redblack_right(left))) {
|
||||
z = key;
|
||||
z_ = value;
|
||||
d = right;
|
||||
|
||||
x = left->key;
|
||||
x_ = redblack_value(left);
|
||||
a = redblack_left(left);
|
||||
|
||||
y = redblack_right(left)->key;
|
||||
y_ = redblack_value(redblack_right(left));
|
||||
b = redblack_left(redblack_right(left));
|
||||
c = redblack_right(redblack_right(left));
|
||||
}
|
||||
else if (redblack_red_p(right) && redblack_red_p(redblack_left(right))) {
|
||||
x = key;
|
||||
x_ = value;
|
||||
a = left;
|
||||
|
||||
z = right->key;
|
||||
z_ = redblack_value(right);
|
||||
d = redblack_right(right);
|
||||
|
||||
y = redblack_left(right)->key;
|
||||
y_ = redblack_value(redblack_left(right));
|
||||
b = redblack_left(redblack_left(right));
|
||||
c = redblack_right(redblack_left(right));
|
||||
}
|
||||
else if (redblack_red_p(right) && redblack_red_p(redblack_right(right))) {
|
||||
x = key;
|
||||
x_ = value;
|
||||
a = left;
|
||||
|
||||
y = right->key;
|
||||
y_ = redblack_value(right);
|
||||
b = redblack_left(right);
|
||||
|
||||
z = redblack_right(right)->key;
|
||||
z_ = redblack_value(redblack_right(right));
|
||||
c = redblack_left(redblack_right(right));
|
||||
d = redblack_right(redblack_right(right));
|
||||
}
|
||||
else {
|
||||
return redblack_new(color, key, value, left, right);
|
||||
}
|
||||
return redblack_new(
|
||||
RED, y, y_,
|
||||
redblack_new(BLACK, x, x_, a, b),
|
||||
redblack_new(BLACK, z, z_, c, d));
|
||||
}
|
||||
|
||||
return redblack_new(color, key, value, left, right);
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_insert_aux(redblack_node_t * tree, ID key, rb_shape_t * value)
|
||||
{
|
||||
if (tree == LEAF) {
|
||||
return redblack_new(RED, key, value, LEAF, LEAF);
|
||||
}
|
||||
else {
|
||||
if (key < tree->key) {
|
||||
return redblack_balance(redblack_color(tree),
|
||||
tree->key,
|
||||
redblack_value(tree),
|
||||
redblack_insert_aux(redblack_left(tree), key, value),
|
||||
redblack_right(tree));
|
||||
}
|
||||
else {
|
||||
if (key > tree->key) {
|
||||
return redblack_balance(redblack_color(tree),
|
||||
tree->key,
|
||||
redblack_value(tree),
|
||||
redblack_left(tree),
|
||||
redblack_insert_aux(redblack_right(tree), key, value));
|
||||
}
|
||||
else {
|
||||
return tree;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_force_black(redblack_node_t * node)
|
||||
{
|
||||
node->value = redblack_value(node);
|
||||
return node;
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_insert(redblack_node_t * tree, ID key, rb_shape_t * value)
|
||||
{
|
||||
redblack_node_t * root = redblack_insert_aux(tree, key, value);
|
||||
|
||||
if (redblack_red_p(root)) {
|
||||
return redblack_force_black(root);
|
||||
}
|
||||
else {
|
||||
return root;
|
||||
}
|
||||
}
|
||||
|
||||
rb_shape_tree_t *rb_shape_tree_ptr = NULL;
|
||||
|
||||
/*
|
||||
@ -152,6 +380,34 @@ rb_shape_alloc(ID edge_name, rb_shape_t * parent, enum shape_type type)
|
||||
return shape;
|
||||
}
|
||||
|
||||
static redblack_node_t *
|
||||
redblack_cache_ancestors(rb_shape_t * shape)
|
||||
{
|
||||
if (shape->ancestor_index) {
|
||||
return shape->ancestor_index;
|
||||
}
|
||||
else {
|
||||
if (shape->parent_id == INVALID_SHAPE_ID) {
|
||||
// We're at the root
|
||||
return shape->ancestor_index;
|
||||
}
|
||||
else {
|
||||
redblack_node_t * parent_index;
|
||||
|
||||
parent_index = redblack_cache_ancestors(rb_shape_get_parent(shape));
|
||||
|
||||
if (shape->type == SHAPE_IVAR) {
|
||||
shape->ancestor_index = redblack_insert(parent_index, shape->edge_name, shape);
|
||||
}
|
||||
else {
|
||||
shape->ancestor_index = parent_index;
|
||||
}
|
||||
|
||||
return shape->ancestor_index;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static rb_shape_t *
|
||||
rb_shape_alloc_new_child(ID id, rb_shape_t * shape, enum shape_type shape_type)
|
||||
{
|
||||
@ -160,6 +416,9 @@ rb_shape_alloc_new_child(ID id, rb_shape_t * shape, enum shape_type shape_type)
|
||||
switch (shape_type) {
|
||||
case SHAPE_IVAR:
|
||||
new_shape->next_iv_index = shape->next_iv_index + 1;
|
||||
if (new_shape->next_iv_index > ANCESTOR_CACHE_THRESHOLD) {
|
||||
redblack_cache_ancestors(new_shape);
|
||||
}
|
||||
break;
|
||||
case SHAPE_CAPACITY_CHANGE:
|
||||
case SHAPE_FROZEN:
|
||||
@ -443,23 +702,37 @@ rb_shape_get_iv_index(rb_shape_t * shape, ID id, attr_index_t *value)
|
||||
RUBY_ASSERT(rb_shape_id(shape) != OBJ_TOO_COMPLEX_SHAPE_ID);
|
||||
|
||||
while (shape->parent_id != INVALID_SHAPE_ID) {
|
||||
if (shape->edge_name == id) {
|
||||
enum shape_type shape_type;
|
||||
shape_type = (enum shape_type)shape->type;
|
||||
|
||||
switch (shape_type) {
|
||||
case SHAPE_IVAR:
|
||||
RUBY_ASSERT(shape->next_iv_index > 0);
|
||||
// Try the ancestor cache if it's available
|
||||
if (shape->ancestor_index && shape->next_iv_index >= ANCESTOR_CACHE_THRESHOLD) {
|
||||
redblack_node_t * node = redblack_find(shape->ancestor_index, id);
|
||||
if (node) {
|
||||
rb_shape_t * shape = redblack_value(node);
|
||||
*value = shape->next_iv_index - 1;
|
||||
return true;
|
||||
case SHAPE_CAPACITY_CHANGE:
|
||||
case SHAPE_ROOT:
|
||||
case SHAPE_INITIAL_CAPACITY:
|
||||
case SHAPE_T_OBJECT:
|
||||
}
|
||||
else {
|
||||
return false;
|
||||
case SHAPE_OBJ_TOO_COMPLEX:
|
||||
case SHAPE_FROZEN:
|
||||
rb_bug("Ivar should not exist on transition");
|
||||
}
|
||||
}
|
||||
else {
|
||||
if (shape->edge_name == id) {
|
||||
enum shape_type shape_type;
|
||||
shape_type = (enum shape_type)shape->type;
|
||||
|
||||
switch (shape_type) {
|
||||
case SHAPE_IVAR:
|
||||
RUBY_ASSERT(shape->next_iv_index > 0);
|
||||
*value = shape->next_iv_index - 1;
|
||||
return true;
|
||||
case SHAPE_CAPACITY_CHANGE:
|
||||
case SHAPE_ROOT:
|
||||
case SHAPE_INITIAL_CAPACITY:
|
||||
case SHAPE_T_OBJECT:
|
||||
return false;
|
||||
case SHAPE_OBJ_TOO_COMPLEX:
|
||||
case SHAPE_FROZEN:
|
||||
rb_bug("Ivar should not exist on transition");
|
||||
}
|
||||
}
|
||||
}
|
||||
shape = rb_shape_get_parent(shape);
|
||||
@ -820,6 +1093,12 @@ Init_default_shapes(void)
|
||||
id_frozen = rb_make_internal_id();
|
||||
id_t_object = rb_make_internal_id();
|
||||
|
||||
#ifdef HAVE_MMAP
|
||||
rb_shape_tree_ptr->shape_cache = (redblack_node_t *)mmap(NULL, rb_size_mul_or_raise(SHAPE_BUFFER_SIZE * 32, sizeof(redblack_node_t), rb_eRuntimeError),
|
||||
PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
|
||||
rb_shape_tree_ptr->cache_size = 0;
|
||||
#endif
|
||||
|
||||
// Shapes by size pool
|
||||
for (int i = 0; i < SIZE_POOL_COUNT; i++) {
|
||||
size_pool_edge_names[i] = rb_make_internal_id();
|
||||
@ -839,6 +1118,7 @@ Init_default_shapes(void)
|
||||
rb_shape_t * new_shape = rb_shape_transition_shape_capa_create(root, capa);
|
||||
new_shape->type = SHAPE_INITIAL_CAPACITY;
|
||||
new_shape->size_pool_index = i;
|
||||
new_shape->ancestor_index = LEAF;
|
||||
RUBY_ASSERT(rb_shape_id(new_shape) == (shape_id_t)i);
|
||||
}
|
||||
|
||||
@ -849,6 +1129,7 @@ Init_default_shapes(void)
|
||||
rb_shape_t * t_object_shape =
|
||||
get_next_shape_internal(shape, id_t_object, SHAPE_T_OBJECT, &dont_care, true, false);
|
||||
t_object_shape->edges = rb_id_table_create(0);
|
||||
t_object_shape->ancestor_index = LEAF;
|
||||
RUBY_ASSERT(rb_shape_id(t_object_shape) == (shape_id_t)(i + SIZE_POOL_COUNT));
|
||||
}
|
||||
|
||||
|
15
shape.h
15
shape.h
@ -17,10 +17,12 @@ typedef uint16_t attr_index_t;
|
||||
|
||||
#if SIZEOF_SHAPE_T == 4
|
||||
typedef uint32_t shape_id_t;
|
||||
typedef uint32_t redblack_id_t;
|
||||
# define SHAPE_ID_NUM_BITS 32
|
||||
# define SHAPE_BUFFER_SIZE 0x80000
|
||||
#else
|
||||
typedef uint16_t shape_id_t;
|
||||
typedef uint16_t redblack_id_t;
|
||||
# define SHAPE_ID_NUM_BITS 16
|
||||
# define SHAPE_BUFFER_SIZE 0x8000
|
||||
#endif
|
||||
@ -40,6 +42,8 @@ typedef uint16_t shape_id_t;
|
||||
# define SPECIAL_CONST_SHAPE_ID (SIZE_POOL_COUNT * 2)
|
||||
# define OBJ_TOO_COMPLEX_SHAPE_ID (SPECIAL_CONST_SHAPE_ID + 1)
|
||||
|
||||
typedef struct redblack_node redblack_node_t;
|
||||
|
||||
struct rb_shape {
|
||||
struct rb_id_table * edges; // id_table from ID (ivar) to next shape
|
||||
ID edge_name; // ID (ivar) for transition from parent to rb_shape
|
||||
@ -48,10 +52,18 @@ struct rb_shape {
|
||||
uint8_t type;
|
||||
uint8_t size_pool_index;
|
||||
shape_id_t parent_id;
|
||||
redblack_node_t * ancestor_index;
|
||||
};
|
||||
|
||||
typedef struct rb_shape rb_shape_t;
|
||||
|
||||
struct redblack_node {
|
||||
ID key;
|
||||
rb_shape_t * value;
|
||||
redblack_id_t l;
|
||||
redblack_id_t r;
|
||||
};
|
||||
|
||||
enum shape_type {
|
||||
SHAPE_ROOT,
|
||||
SHAPE_IVAR,
|
||||
@ -67,6 +79,9 @@ typedef struct {
|
||||
rb_shape_t *shape_list;
|
||||
rb_shape_t *root_shape;
|
||||
shape_id_t next_shape_id;
|
||||
|
||||
redblack_node_t *shape_cache;
|
||||
unsigned int cache_size;
|
||||
} rb_shape_tree_t;
|
||||
RUBY_EXTERN rb_shape_tree_t *rb_shape_tree_ptr;
|
||||
|
||||
|
8
vm.c
8
vm.c
@ -633,6 +633,8 @@ rb_dtrace_setup(rb_execution_context_t *ec, VALUE klass, ID id,
|
||||
return FALSE;
|
||||
}
|
||||
|
||||
extern unsigned int redblack_buffer_size;
|
||||
|
||||
/*
|
||||
* call-seq:
|
||||
* RubyVM.stat -> Hash
|
||||
@ -660,6 +662,7 @@ static VALUE
|
||||
vm_stat(int argc, VALUE *argv, VALUE self)
|
||||
{
|
||||
static VALUE sym_constant_cache_invalidations, sym_constant_cache_misses, sym_global_cvar_state, sym_next_shape_id;
|
||||
static VALUE sym_shape_cache_size;
|
||||
VALUE arg = Qnil;
|
||||
VALUE hash = Qnil, key = Qnil;
|
||||
|
||||
@ -681,6 +684,7 @@ vm_stat(int argc, VALUE *argv, VALUE self)
|
||||
S(constant_cache_misses);
|
||||
S(global_cvar_state);
|
||||
S(next_shape_id);
|
||||
S(shape_cache_size);
|
||||
#undef S
|
||||
|
||||
#define SET(name, attr) \
|
||||
@ -693,6 +697,7 @@ vm_stat(int argc, VALUE *argv, VALUE self)
|
||||
SET(constant_cache_misses, ruby_vm_constant_cache_misses);
|
||||
SET(global_cvar_state, ruby_vm_global_cvar_state);
|
||||
SET(next_shape_id, (rb_serial_t)GET_SHAPE_TREE()->next_shape_id);
|
||||
SET(shape_cache_size, (rb_serial_t)GET_SHAPE_TREE()->cache_size);
|
||||
#undef SET
|
||||
|
||||
#if USE_DEBUG_COUNTER
|
||||
@ -3069,7 +3074,8 @@ vm_memsize(const void *ptr)
|
||||
vm_memsize_builtin_function_table(vm->builtin_function_table) +
|
||||
rb_id_table_memsize(vm->negative_cme_table) +
|
||||
rb_st_memsize(vm->overloaded_cme_table) +
|
||||
vm_memsize_constant_cache()
|
||||
vm_memsize_constant_cache() +
|
||||
GET_SHAPE_TREE()->cache_size * sizeof(redblack_node_t)
|
||||
);
|
||||
|
||||
// TODO
|
||||
|
Loading…
x
Reference in New Issue
Block a user