dce · April 1, 2013 11:55
diff --git a/main.c b/main.c
 // https://github.com/josephg/librope

 #include <stdlib.h>
 #include <stdio.h>

 #include "rope.h"

 // Render the rope into a freshly allocated C string, print it on its own
 // line, and release the buffer. Returns 0 on success, -1 if allocation fails.
 static int
 print_rope(rope *r)
 {
    // rope_write_cstr() writes rope_byte_count(r) bytes followed by a
    // terminating '\0', so the buffer needs one extra byte.
    uint8_t *str = malloc(rope_byte_count(r) + 1);

    if (str == NULL) {
        fprintf(stderr, "out of memory\n");
        return -1;
    }

    rope_write_cstr(r, str);
    printf("%s\n", (const char *)str);
    free(str);

    return 0;
 }

 // Demo driver: builds a rope, deletes from it, inserts into it again, and
 // prints the contents after each step.
 int
 main()
 {
    int status = 0;
    rope *r = rope_new();

    rope_insert(r, 0, (const uint8_t *)"Hello, World!");
    if (print_rope(r) != 0)
        status = 1;

    rope_del(r, 5, 7);
    if (print_rope(r) != 0)
        status = 1;

    rope_insert(r, 5, (const uint8_t *)", Pootrick");
    if (print_rope(r) != 0)
        status = 1;

    rope_free(r);

    return status;
 }
diff --git a/Makefile b/Makefile
 # Flags applied to every compile step: debug info plus the common warning sets.
 CFLAGS = -g -Wall -Wextra

 # None of these targets name a file that the rule produces.
 .PHONY: all rope clean

 # Build the demo binary. rope.o is rebuilt first through the rope target.
 all: rope
 	gcc $(CFLAGS) -o main main.c rope.o

 # Compile the rope library into an object file.
 rope:
 	gcc $(CFLAGS) -o rope.o -c rope.c

 # Remove all build products.
 clean:
 	rm -rf main *.dSYM rope.o
diff --git a/rope.c b/rope.c
 // Implementation for rope library.

 #include <stdlib.h>
 #include <string.h>

 // Needed for VC++, which always compiles in C++ mode and doesn't have stdbool.
 #ifndef __cplusplus
 #include <stdbool.h>
 #endif

 #include <assert.h>
 #include "rope.h"

 // The number of bytes the rope head structure takes up
 static const size_t ROPE_SIZE = sizeof(rope) + sizeof(rope_node) * ROPE_MAX_HEIGHT;

 // Create a new rope with no contents, using the supplied allocator callbacks.
 // The callbacks are stored in the rope and used for its later allocations.
 // Returns NULL if alloc() fails to provide memory for the rope head.
 rope *rope_new2(void *(*alloc)(size_t bytes),
                 void *(*realloc)(void *ptr, size_t newsize),
                 void (*free)(void *ptr)) {
   rope *r = (rope *)alloc(ROPE_SIZE);
   if (r == NULL) {
     // Allocation failed; there is nothing to initialise.
     return NULL;
   }

   r->num_chars = r->num_bytes = 0;

   r->alloc = alloc;
   r->realloc = realloc;
   r->free = free;

   // An empty rope still has a head of height 1 whose single link points
   // nowhere and spans zero characters.
   r->head.height = 1;
   r->head.num_bytes = 0;
   r->head.nexts[0].node = NULL;
   r->head.nexts[0].skip_size = 0;
 #if ROPE_WCHAR
   r->head.nexts[0].wchar_size = 0;
 #endif
   return r;
 }

 // Create an empty rope backed by the C library's malloc/realloc/free.
 rope *rope_new() {
   rope *fresh = rope_new2(malloc, realloc, free);
   return fresh;
 }

 // Build a rope with the default allocators and fill it with the given
 // NUL-terminated UTF-8 string.
 rope *rope_new_with_utf8(const uint8_t *str) {
   rope *fresh = rope_new();

   // Position 0 of an empty rope: the whole string becomes the contents.
   rope_insert(fresh, 0, str);

   return fresh;
 }

 // Make a deep copy of a rope. The copy uses the same allocator callbacks as
 // the original and gets its own copy of every node.
 rope *rope_copy(const rope *other) {
   rope *copy = (rope *)other->alloc(ROPE_SIZE);
   // For each level, the most recently copied node whose link at that level
   // still has to be pointed at the next copied node.
   rope_node *tail[ROPE_MAX_HEIGHT];
   rope_node *src;
   int level;

   // Struct assignment copies the counters, the allocator callbacks and the
   // fixed part of the head; the head's nexts[] entries are copied below.
   *copy = *other;

   for (level = 0; level < other->head.height; level++) {
     // Links that point at a node are redirected to its copy further down.
     copy->head.nexts[level] = other->head.nexts[level];
     tail[level] = &copy->head;
   }

   src = other->head.nexts[0].node;
   while (src != NULL) {
     size_t height = src->height;
     size_t links_bytes = height * sizeof(rope_skip_node);
     rope_node *node_copy = (rope_node *)copy->alloc(sizeof(rope_node) + links_bytes);
     unsigned int lvl;

     node_copy->height = height;
     node_copy->num_bytes = src->num_bytes;
     memcpy(node_copy->str, src->str, src->num_bytes);
     memcpy(node_copy->nexts, src->nexts, links_bytes);

     // Hook the copy in after the previous node at each level it takes part in.
     for (lvl = 0; lvl < height; lvl++) {
       tail[lvl]->nexts[lvl].node = node_copy;
       tail[lvl] = node_copy;
     }

     src = src->nexts[0].node;
   }

   return copy;
 }

 // Release every node of the rope and then the rope itself, using the rope's
 // own free callback.
 void rope_free(rope *r) {
   assert(r);

   rope_node *cur = r->head.nexts[0].node;
   while (cur != NULL) {
     // Read the successor before the node is released.
     rope_node *following = cur->nexts[0].node;
     r->free(cur);
     cur = following;
   }

   // The head node lives inside the rope allocation, so this frees it too.
   r->free(r);
 }

 // Return the rope's cached character count.
 size_t rope_char_count(rope *r) {
   assert(r);
   size_t chars = r->num_chars;
   return chars;
 }

 // Return the rope's cached byte count, i.e. the length of its contents as a
 // UTF-8 string (not counting any terminating '\0').
 size_t rope_byte_count(rope *r) {
   assert(r);
   size_t bytes = r->num_bytes;
   return bytes;
 }

 // Write the rope's contents into dest as a UTF-8 C string, including the
 // terminating '\0'. dest must have room for rope_byte_count(r) + 1 bytes.
 // Returns the number of bytes written, which is rope_byte_count(r) + 1.
 size_t rope_write_cstr(rope *r, uint8_t *dest) {
   size_t num_bytes = rope_byte_count(r);
   uint8_t *p = dest;
   rope_node *n;

   // The terminator's position is known up front.
   dest[num_bytes] = '\0';

   if (num_bytes == 0) {
     return num_bytes + 1;
   }

   // Concatenate every node's bytes, starting with the head node.
   n = &r->head;
   while (n != NULL) {
     memcpy(p, n->str, n->num_bytes);
     p += n->num_bytes;
     n = n->nexts[0].node;
   }

   assert(p == &dest[num_bytes]);
   return num_bytes + 1;
 }

 // Create a new C string which contains the rope encoded as utf8, followed by
 // a trailing '\0'. The buffer is obtained from the rope's alloc callback.
 // Returns NULL if that allocation fails.
 uint8_t *rope_create_cstr(rope *r) {
   uint8_t *bytes = (uint8_t *)r->alloc(rope_byte_count(r) + 1); // Room for a zero.
   if (bytes == NULL) {
     // Nothing to write into; report the failure to the caller.
     return NULL;
   }
   rope_write_cstr(r, bytes);
   return bytes;
 }

 #if ROPE_WCHAR
 // Return the wchar count stored on the head node's topmost link.
 size_t rope_wchar_count(rope *r) {
   assert(r);
   int top = r->head.height - 1;
   return r->head.nexts[top].wchar_size;
 }
 #endif

 // Smaller / larger of two values. Both are plain macros, so each argument may
 // be evaluated twice: do not pass expressions with side effects.
 #define MIN(x,y) ((x) > (y) ? (y) : (x))
 #define MAX(x,y) ((x) > (y) ? (x) : (y))

 #ifdef _WIN32
 // On Windows builds, provide random() as a thin wrapper around rand() so the
 // rest of this file can call random() unconditionally.
 inline static long random() {
   return rand();
 }
 #endif

 // Pick a random height for a new node. Starting from 1, the height grows by
 // one each time (random() % 100) < ROPE_BIAS, up to ROPE_MAX_HEIGHT - 1.
 static uint8_t random_height() {
   // This is wasteful with entropy, but random_height barely shows up in
   // profiles, so it has not been worth optimising.
   uint8_t height;

   // The head's height is the tallest node's height + 1, so an ordinary node
   // may be at most ROPE_MAX_HEIGHT - 1 tall.
   for (height = 1; height < (ROPE_MAX_HEIGHT - 1); height++) {
     if ((random() % 100) >= ROPE_BIAS) {
       break;
     }
   }

   return height;
 }

 // Number of bytes to allocate for a node with `height` skip links: the fixed
 // part of the node plus its trailing nexts[] array.
 static size_t node_size(uint8_t height) {
   size_t links_bytes = height * sizeof(rope_skip_node);
   return sizeof(rope_node) + links_bytes;
 }

 // Allocate a node of the given height with the rope's alloc callback. Only
 // the height field is initialised; everything else is left as allocated.
 // This function should be replaced at some point with an object pool based version.
 static rope_node *alloc_node(rope *r, uint8_t height) {
   size_t bytes = node_size(height);
   rope_node *fresh = (rope_node *)r->alloc(bytes);
   fresh->height = height;
   return fresh;
 }

 // Given the first byte of an encoded character, report how many bytes the
 // whole character occupies, judged by the byte's leading bit pattern.
 // Returns 1..6, or SIZE_MAX if the byte cannot start a character.
 static inline size_t codepoint_size(uint8_t byte) {
   if ((byte & 0x80) == 0x00) return 1;        // 0xxxxxxx
   if ((byte & 0xc0) == 0x80) return SIZE_MAX; // 10xxxxxx: continuation byte
   if ((byte & 0xe0) == 0xc0) return 2;        // 110xxxxx
   if ((byte & 0xf0) == 0xe0) return 3;        // 1110xxxx
   if ((byte & 0xf8) == 0xf0) return 4;        // 11110xxx
   if ((byte & 0xfc) == 0xf8) return 5;        // 111110xx
   if ((byte & 0xfe) == 0xfc) return 6;        // 1111110x
   return SIZE_MAX;                            // 0xfe and 0xff
 }

 // Return how many bytes the first num_chars characters of str occupy, by
 // stepping over one character at a time using each lead byte's size.
 static size_t count_bytes_in_utf8(const uint8_t *str, size_t num_chars) {
   const uint8_t *cursor = str;
   unsigned int seen = 0;

   while (seen < num_chars) {
     cursor += codepoint_size(*cursor);
     seen++;
   }

   return cursor - str;
 }

 #if ROPE_WCHAR

 // True (1) when the top four bits of lead byte x are all set, i.e. x >= 0xf0.
 // The counting helpers below charge two wchars for such a character and one
 // wchar for any other.
 #define NEEDS_TWO_WCHARS(x) (((x) & 0xf0) == 0xf0)

 // Return how many wchars the first num_chars characters of str take up:
 // two for a character whose lead byte satisfies NEEDS_TWO_WCHARS, else one.
 static size_t count_wchars_in_utf8(const uint8_t *str, size_t num_chars) {
   size_t wchars = 0;
   unsigned int seen = 0;

   while (seen < num_chars) {
     uint8_t lead = *str;
     wchars += NEEDS_TWO_WCHARS(lead) ? 2 : 1;
     str += codepoint_size(lead);
     seen++;
   }

   return wchars;
 }

 // Return how many characters of str are covered by its first num_wchars
 // wchars. Starts from num_wchars and subtracts one for every character that
 // accounts for two wchars.
 static size_t count_utf8_in_wchars(const uint8_t *str, size_t num_wchars) {
   size_t chars = num_wchars;
   unsigned int consumed = 0;

   while (consumed < num_wchars) {
     uint8_t lead = *str;
     if (NEEDS_TWO_WCHARS(lead)) {
       // One character used up two wchars.
       chars--;
       consumed += 2;
     } else {
       consumed += 1;
     }
     str += codepoint_size(lead);
   }

   return chars;
 }
 #endif

 // Count the characters in a NUL-terminated UTF-8 string by hopping from lead
 // byte to lead byte until the terminator is reached.
 static size_t strlen_utf8(const uint8_t *str) {
   size_t count = 0;
   const uint8_t *p;

   for (p = str; *p; p += codepoint_size(*p)) {
     count++;
   }

   return count;
 }

 // A position inside a rope, as produced by iter_at_char_pos() and
 // iter_at_wchar_pos() and consumed by the insert/delete helpers.
 typedef struct {
   // This stores the previous node at each height, and the number of characters from the start of
   // the previous node to the current iterator position.
   // Only entries below the rope head's current height are filled in by the
   // iter_at_* functions.
   rope_skip_node s[ROPE_MAX_HEIGHT];
 } rope_iter;

 // Internal function for navigating to a particular character offset in the rope.
 // The function returns the list of nodes which point past the position, as well as
 // offsets of how far into their character lists the specified characters are.
 //
 // r:        the rope to search.
 // char_pos: target position in characters; asserted to be <= r->num_chars.
 // iter:     output. For every level below the head's height, iter->s[level]
 //           receives the node the search descended from at that level and the
 //           character offset from the start of that node to char_pos.
 //
 // Returns the level-0 node, which is also iter->s[0].node.
 static rope_node *iter_at_char_pos(rope *r, size_t char_pos, rope_iter *iter) {
   assert(char_pos <= r->num_chars);

   // Start at the head node on its topmost level.
   rope_node *e = &r->head;
   int height = r->head.height - 1;

   // Offset stores how many characters we still need to skip in the current node.
   size_t offset = char_pos;
   size_t skip;
 #if ROPE_WCHAR
   size_t wchar_pos = 0; // Current wchar pos from the start of the rope.
 #endif

   while (true) {
     skip = e->nexts[height].skip_size;
     // Strict comparison: a position exactly at the end of this link's span
     // stays with the current node rather than moving to the next one.
     if (offset > skip) {
       // Go right.
       assert(e == &r->head || e->num_bytes);

       offset -= skip;
 #if ROPE_WCHAR
       wchar_pos += e->nexts[height].wchar_size;
 #endif
       e = e->nexts[height].node;
     } else {
       // Go down.
       iter->s[height].skip_size = offset;
       iter->s[height].node = e;
 #if ROPE_WCHAR
       // Temporarily holds the wchar position of the start of e; converted
       // to an offset from e once the final position is known (below).
       iter->s[height].wchar_size = wchar_pos;
 #endif

       if (height == 0) {
         break;
       } else {
         height--;
       }
     }
   }

 #if ROPE_WCHAR
   int i;

   // For some reason, this is _REALLY SLOW_. Like, 5.5Mops/s -> 4Mops/s from this block of code.
   wchar_pos += count_wchars_in_utf8(e->str, offset);

   // The iterator has the wchar pos from the start of the whole string.
   // Turn each stored node-start position into "wchars from that node's
   // start to the target position".
   for (i = 0; i < r->head.height; i++) {
     iter->s[i].wchar_size = wchar_pos - iter->s[i].wchar_size;
   }
 #endif

   assert(offset <= ROPE_NODE_STR_SIZE);
   assert(iter->s[0].node == e);
   return e;
 }

 #if ROPE_WCHAR
 // Equivalent of iter_at_char_pos, but for wchar positions instead.
 //
 // r:         the rope to search.
 // wchar_pos: target position in wchars; asserted to be no larger than the
 //            wchar total stored on the head's topmost link.
 // iter:      output. For every level below the head's height, iter->s[level]
 //            receives the node the search descended from, the wchar offset
 //            from that node's start to the target, and (after the final loop)
 //            the matching character offset.
 //
 // Returns the level-0 node, which is also iter->s[0].node.
 static rope_node *iter_at_wchar_pos(rope *r, size_t wchar_pos, rope_iter *iter) {
   int i;
   int height = r->head.height - 1;
   assert(wchar_pos <= r->head.nexts[height].wchar_size);

   rope_node *e = &r->head;

   // Offset stores how many wchar characters we still need to skip in the current node.
   size_t offset = wchar_pos;
   size_t skip;
   size_t char_pos = 0; // Current char pos from the start of the rope.

   while (true) {
     skip = e->nexts[height].wchar_size;
     if (offset > skip) {
       // Go right.
       offset -= skip;
       char_pos += e->nexts[height].skip_size;
       e = e->nexts[height].node;
     } else {
       // Go down.
       // skip_size temporarily holds the character position of the start of
       // e; it is converted to an offset from e in the loop below.
       iter->s[height].skip_size = char_pos;
       iter->s[height].node = e;
       iter->s[height].wchar_size = offset;

       if (height == 0) {
         break;
       } else {
         height--;
       }
     }
   }

   // Add the characters covered by the remaining wchars inside the final node.
   char_pos += count_utf8_in_wchars(e->str, offset);

   // The iterator has character positions from the start of the rope to the start of the node.
   for (i = 0; i < r->head.height; i++) {
     iter->s[i].skip_size = char_pos - iter->s[i].skip_size;
   }
   assert(e == iter->s[0].node);
   return e;
 }
 #endif

 #if ROPE_WCHAR
 // Add num_chars / num_wchars to the link that the iterator records at every
 // level of the rope (levels 0 .. head height - 1).
 static void update_offset_list(rope *r, rope_iter *iter, size_t num_chars, size_t num_wchars) {
   int level = 0;

   while (level < r->head.height) {
     rope_skip_node *link = &iter->s[level].node->nexts[level];
     link->skip_size += num_chars;
     link->wchar_size += num_wchars;
     level++;
   }
 }
 #else
 // Add num_chars to the link that the iterator records at every level of the
 // rope (levels 0 .. head height - 1).
 static void update_offset_list(rope *r, rope_iter *iter, size_t num_chars) {
   int level = 0;

   while (level < r->head.height) {
     rope_skip_node *link = &iter->s[level].node->nexts[level];
     link->skip_size += num_chars;
     level++;
   }
 }
 #endif


 // Internal method of rope_insert.
 // This function creates a new node in the rope at the specified position and fills it with the
 // passed string.
 //
 // r:         the rope being modified.
 // iter:      the insertion position; on return it has been moved to the end
 //            of the newly inserted node.
 // str:       the bytes to copy into the new node.
 // num_bytes: how many bytes of str to copy.
 // num_chars: how many characters those bytes contain.
 //
 // The rope's num_chars and num_bytes totals are increased accordingly.
 static void insert_at(rope *r, rope_iter *iter,
     const uint8_t *str, size_t num_bytes, size_t num_chars) {
 #if ROPE_WCHAR
   size_t num_wchars = count_wchars_in_utf8(str, num_chars);
 #endif

   // This describes how many levels of the iter are filled in.
   uint8_t max_height = r->head.height;
   uint8_t new_height = random_height();
   rope_node *new_node = alloc_node(r, new_height);
   new_node->num_bytes = num_bytes;
   memcpy(new_node->str, str, num_bytes);

   assert(new_height < ROPE_MAX_HEIGHT);

   // Max height (the rope's head's height) must be 1+ the height of the largest node.
   while (max_height <= new_height) {
     r->head.height++;
     // The new top level starts out as a copy of the level beneath it.
     r->head.nexts[max_height] = r->head.nexts[max_height - 1];

     // This is the position (offset from the start) of the rope.
     iter->s[max_height] = iter->s[max_height - 1];
     max_height++;
   }

   // Fill in the new node's nexts array.
   int i;

   // Levels the new node takes part in: splice it in after the iterator's
   // node, splitting that node's old span between the two links.
   for (i = 0; i < new_height; i++) {
     rope_skip_node *prev_skip = &iter->s[i].node->nexts[i];
     new_node->nexts[i].node = prev_skip->node;
     new_node->nexts[i].skip_size = num_chars + prev_skip->skip_size - iter->s[i].skip_size;


     prev_skip->node = new_node;
     prev_skip->skip_size = iter->s[i].skip_size;

     // & move the iterator to the end of the newly inserted node.
     iter->s[i].node = new_node;
     iter->s[i].skip_size = num_chars;
 #if ROPE_WCHAR
     new_node->nexts[i].wchar_size = num_wchars + prev_skip->wchar_size - iter->s[i].wchar_size;
     prev_skip->wchar_size = iter->s[i].wchar_size;
     iter->s[i].wchar_size = num_wchars;
 #endif
   }

   // Levels above the new node: the existing link simply spans more
   // characters, and the iterator moves forward by the same amount.
   for (; i < max_height; i++) {
     iter->s[i].node->nexts[i].skip_size += num_chars;
     iter->s[i].skip_size += num_chars;
 #if ROPE_WCHAR
     iter->s[i].node->nexts[i].wchar_size += num_wchars;
     iter->s[i].wchar_size += num_wchars;
 #endif
   }

   r->num_chars += num_chars;
   r->num_bytes += num_bytes;
 }

 // Insert the given utf8 string into the rope at the specified position.
 //
 // r:    the rope being modified.
 // e:    the level-0 node containing the position (as returned by iter_at_*).
 // iter: the position inside the rope.
 // str:  NUL-terminated UTF-8 string to insert.
 //
 // Three cases are handled: the string fits into e, the position is at the very
 // end of e and the string fits at the start of the following node, or neither,
 // in which case new nodes are created.
 static void rope_insert_at_iter(rope *r, rope_node *e, rope_iter *iter, const uint8_t *str) {
   int i;

   // iter.offset contains how far (in characters) into the current element to skip.
   // Figure out how much that is in bytes.
   size_t offset_bytes = 0;
   // The insertion offset into the destination node.
   size_t offset = iter->s[0].skip_size;
   if (offset) {
     assert(offset <= e->nexts[0].skip_size);
     offset_bytes = count_bytes_in_utf8(e->str, offset);
   }

   // Maybe we can insert the characters into the current node?
   size_t num_inserted_bytes = strlen((char *)str);

   // Can we insert into the current node?
   bool insert_here = e->num_bytes + num_inserted_bytes <= ROPE_NODE_STR_SIZE;

   // Can we insert into the subsequent node?
   rope_node *next = NULL;
   if (!insert_here && offset_bytes == e->num_bytes) {
     next = e->nexts[0].node;
     // We can insert into the subsequent node if:
     // - We can't insert into the current node
     // - There _is_ a next node to insert into
     // - The insert would be at the start of the next node
     // - There's room in the next node
     if (next && next->num_bytes + num_inserted_bytes <= ROPE_NODE_STR_SIZE) {
       offset = offset_bytes = 0;
       // Re-point the iterator at `next` for every level `next` takes part in,
       // so that the offset update below adjusts next's own links.
       for (i = 0; i < next->height; i++) {
         iter->s[i].node = next;
         // tree offset nodes will not be used.
       }
       e = next;

       insert_here = true;
     }
   }

   if (insert_here) {
     // First move the current bytes later on in the string.
     if (offset_bytes < e->num_bytes) {
       memmove(&e->str[offset_bytes + num_inserted_bytes],
               &e->str[offset_bytes],
               e->num_bytes - offset_bytes);
     }

     // Then copy in the string bytes
     memcpy(&e->str[offset_bytes], str, num_inserted_bytes);
     e->num_bytes += num_inserted_bytes;

     r->num_bytes += num_inserted_bytes;
     size_t num_inserted_chars = strlen_utf8(str);
     r->num_chars += num_inserted_chars;

     // .... aaaand update all the offset amounts.
 #if ROPE_WCHAR
     size_t num_inserted_wchars = count_wchars_in_utf8(str, num_inserted_chars);
     update_offset_list(r, iter, num_inserted_chars, num_inserted_wchars);
 #else
     update_offset_list(r, iter, num_inserted_chars);
 #endif

   } else {
     // There isn't room. We'll need to add at least one new node to the rope.

     // If we're not at the end of the current node, we'll need to remove
     // the end of the current node's data and reinsert it later.
     // num_end_chars is only assigned, and only read, when num_end_bytes != 0.
     size_t num_end_chars, num_end_bytes = e->num_bytes - offset_bytes;
     if (num_end_bytes) {
       // We'll pretend like the character have been deleted from the node, while leaving
       // the bytes themselves there (for later).
       e->num_bytes = offset_bytes;
       num_end_chars = e->nexts[0].skip_size - offset;
       // The counts are passed negated; as size_t they wrap around, so the
       // "+=" inside update_offset_list performs a subtraction.
 #if ROPE_WCHAR
       size_t num_end_wchars = count_wchars_in_utf8(&e->str[offset_bytes], num_end_chars);
       update_offset_list(r, iter, -num_end_chars, -num_end_wchars);
 #else
       update_offset_list(r, iter, -num_end_chars);
 #endif

       r->num_chars -= num_end_chars;
       r->num_bytes -= num_end_bytes;
     }

     // Now we insert new nodes containing the new character data. The data must be broken into
     // pieces of with a maximum size of ROPE_NODE_STR_SIZE. Node boundaries must not occur in the
     // middle of a utf8 codepoint.
     size_t str_offset = 0;
     while (str_offset < num_inserted_bytes) {
       size_t new_node_bytes = 0;
       size_t new_node_chars = 0;

       // Take whole characters until the next one would overflow the node.
       // NOTE(review): codepoint_size() returns SIZE_MAX for a byte that
       // cannot start a character; with new_node_bytes == 0 that looks like
       // it breaks out immediately without advancing str_offset. Confirm how
       // invalid UTF-8 input is meant to be handled here.
       while (str_offset + new_node_bytes < num_inserted_bytes) {
         size_t cs = codepoint_size(str[str_offset + new_node_bytes]);
         if (cs + new_node_bytes > ROPE_NODE_STR_SIZE) {
           break;
         } else {
           new_node_bytes += cs;
           new_node_chars++;
         }
       }

       insert_at(r, iter, &str[str_offset], new_node_bytes, new_node_chars);
       str_offset += new_node_bytes;
     }

     // Re-insert the tail that was cut off the original node; its bytes are
     // still sitting in e->str past the shortened num_bytes.
     if (num_end_bytes) {
       insert_at(r, iter, &e->str[offset_bytes], num_end_bytes, num_end_chars);
     }
   }
 }

 // Insert the NUL-terminated UTF-8 string str at character position pos.
 // A pos beyond the end of the rope is clamped to the end.
 void rope_insert(rope *r, size_t pos, const uint8_t *str) {
   assert(r);
   assert(str);
 #ifdef DEBUG
   _rope_check(r);
 #endif
   if (pos > r->num_chars) {
     pos = r->num_chars;
   }

   // Locate the node that holds the insertion point, then insert there.
   rope_iter where;
   rope_node *target = iter_at_char_pos(r, pos, &where);
   rope_insert_at_iter(r, target, &where, str);

 #ifdef DEBUG
   _rope_check(r);
 #endif
 }

 #if ROPE_WCHAR
 // Insert the NUL-terminated UTF-8 string str at the given wchar position.
 // A position beyond the end of the rope is clamped to the end.
 // Returns the insertion position measured in characters.
 size_t rope_insert_at_wchar(rope *r, size_t wchar_pos, const uint8_t *str) {
   assert(r);
   assert(str);
 #ifdef DEBUG
   _rope_check(r);
 #endif
   size_t total_wchars = rope_wchar_count(r);
   if (wchar_pos > total_wchars) {
     wchar_pos = total_wchars;
   }

   // Locate the node that holds the insertion point.
   rope_iter where;
   rope_node *target = iter_at_wchar_pos(r, wchar_pos, &where);

   // Read the character position from the top level before inserting, since
   // the insert modifies the iterator.
   int top = r->head.height - 1;
   size_t char_pos = where.s[top].skip_size;

   rope_insert_at_iter(r, target, &where, str);

 #ifdef DEBUG
   _rope_check(r);
 #endif
   return char_pos;
 }

 #endif

 // Internal worker for rope_del / rope_del_at_wchar: delete `length`
 // characters starting at the position described by iter.
 //
 // r:      the rope being modified.
 // e:      the level-0 node containing the position (as returned by iter_at_*).
 // iter:   the position inside the rope.
 // length: number of characters to delete. No clamping happens here; the
 //         public callers clamp the range before calling.
 //
 // Each pass of the loop either trims characters out of one node or unlinks
 // and frees a node that is deleted in full.
 static void rope_del_at_iter(rope *r, rope_node *e, rope_iter *iter, size_t length) {  
   r->num_chars -= length;
   size_t offset = iter->s[0].skip_size;
   while (length) {
     if (offset == e->nexts[0].skip_size) {
       // End of the current node. Skip to the start of the next one.
       e = iter->s[0].node->nexts[0].node;
       offset = 0;
     }

     size_t num_chars = e->nexts[0].skip_size;
     size_t removed = MIN(length, num_chars - offset);
 #if ROPE_WCHAR
     size_t removed_wchars;
 #endif

     int i;
     // The head node is embedded in the rope itself, so it is only ever
     // trimmed, never unlinked.
     if (removed < num_chars || e == &r->head) {
       // Just trim this node down to size.
       size_t leading_bytes = count_bytes_in_utf8(e->str, offset);
       size_t removed_bytes = count_bytes_in_utf8(&e->str[leading_bytes], removed);
       size_t trailing_bytes = e->num_bytes - leading_bytes - removed_bytes;
 #if ROPE_WCHAR
       removed_wchars = count_wchars_in_utf8(&e->str[leading_bytes], removed);
 #endif
       if (trailing_bytes) {
         memmove(&e->str[leading_bytes], &e->str[leading_bytes + removed_bytes], trailing_bytes);
       }
       e->num_bytes -= removed_bytes;
       r->num_bytes -= removed_bytes;

       // Every link owned by e now spans fewer characters.
       for (i = 0; i < e->height; i++) {
         e->nexts[i].skip_size -= removed;
 #if ROPE_WCHAR
         e->nexts[i].wchar_size -= removed_wchars;
 #endif
       }
     } else {
       // Remove the node from the list
 #if ROPE_WCHAR
       removed_wchars = e->nexts[0].wchar_size;
 #endif
       // At each of e's levels, make the iterator's node link past e and
       // absorb what is left of e's span.
       for (i = 0; i < e->height; i++) {
         iter->s[i].node->nexts[i].node = e->nexts[i].node;
         iter->s[i].node->nexts[i].skip_size += e->nexts[i].skip_size - removed;
 #if ROPE_WCHAR
         iter->s[i].node->nexts[i].wchar_size += e->nexts[i].wchar_size - removed_wchars;
 #endif
       }

       r->num_bytes -= e->num_bytes;
       // TODO: Recycle e.
       rope_node *next = e->nexts[0].node;
       r->free(e);
       e = next;
     }

     // i continues from e's height: the levels above e are links that pass
     // over it, so they just shrink by the removed amount.
     for (; i < r->head.height; i++) {
       iter->s[i].node->nexts[i].skip_size -= removed;
 #if ROPE_WCHAR
       iter->s[i].node->nexts[i].wchar_size -= removed_wchars;
 #endif
     }

     length -= removed;
   }
 }

 // Delete `length` characters starting at character position `pos`.
 // Both values are clamped to the rope's contents, so deleting past the end of
 // the string has no effect.
 void rope_del(rope *r, size_t pos, size_t length) {
   // Validate r before anything dereferences it (the DEBUG check does).
   assert(r);
 #ifdef DEBUG
   _rope_check(r);
 #endif

   pos = MIN(pos, r->num_chars);
   length = MIN(length, r->num_chars - pos);

   rope_iter iter;

   // Search for the node where the deleted range starts.
   rope_node *e = iter_at_char_pos(r, pos, &iter);

   rope_del_at_iter(r, e, &iter, length);

 #ifdef DEBUG
   _rope_check(r);
 #endif
 }

 #if ROPE_WCHAR
 // Delete wchar_num wchars starting at wchar position wchar_pos. Both values
 // are clamped to the rope's contents.
 // Returns the deletion position in characters. If char_len_out is not NULL,
 // *char_len_out receives the number of characters deleted.
 size_t rope_del_at_wchar(rope *r, size_t wchar_pos, size_t wchar_num, size_t *char_len_out) {
   // Validate r before anything dereferences it (the DEBUG check does).
   assert(r);
 #ifdef DEBUG
   _rope_check(r);
 #endif

   size_t wchar_total = rope_wchar_count(r);
   wchar_pos = MIN(wchar_pos, wchar_total);
   wchar_num = MIN(wchar_num, wchar_total - wchar_pos);

   rope_iter iter;

   // Search for the node where the deleted range starts.
   rope_node *start = iter_at_wchar_pos(r, wchar_pos, &iter);
   size_t char_pos = iter.s[r->head.height - 1].skip_size;

   // Find the end of the range as well; the difference between the two
   // top-level character offsets is the deletion length in characters.
   rope_iter end_iter;
   int h = r->head.height - 1;
   iter_at_wchar_pos(r, iter.s[h].wchar_size + wchar_num, &end_iter);

   size_t char_length = end_iter.s[h].skip_size - iter.s[h].skip_size;
   rope_del_at_iter(r, start, &iter, char_length);

 #ifdef DEBUG
   _rope_check(r);
 #endif
   if (char_len_out) {
     *char_len_out = char_length;
   }
   return char_pos;
 }
 #endif

 // Debugging aid: walk the whole rope and assert that its bookkeeping is
 // consistent (per-node byte/char counts, skip sizes at every level, and the
 // totals cached on the rope).
 void _rope_check(rope *r) {
   int i;

   assert(r->head.height); // Even empty ropes have a height of 1.
   assert(r->num_bytes >= r->num_chars);

   // The head's topmost link must span the whole rope and point nowhere.
   rope_skip_node skip_over = r->head.nexts[r->head.height - 1];
   assert(skip_over.skip_size == r->num_chars);
   assert(skip_over.node == NULL);

   rope_node *n;

   size_t num_bytes = 0;
   size_t num_chars = 0;
 #if ROPE_WCHAR
   size_t num_wchar = 0;
 #endif

   // The offsets here are used to store the total distance travelled from the start
   // of the rope.
   // {0} zero-initialises the whole aggregate and, unlike an empty {}, is
   // valid in every C standard version.
   rope_iter iter = {0};
   for (i = 0; i < r->head.height; i++) {
     iter.s[i].node = &r->head;
   }

   for (n = &r->head; n != NULL; n = n->nexts[0].node) {
     // Only the head node may be empty.
     assert(n == &r->head || n->num_bytes);
     assert(n->height <= ROPE_MAX_HEIGHT);
     assert(count_bytes_in_utf8(n->str, n->nexts[0].skip_size) == n->num_bytes);
 #if ROPE_WCHAR
     assert(count_wchars_in_utf8(n->str, n->nexts[0].skip_size) == n->nexts[0].wchar_size);
 #endif
     // At each level n takes part in, the previous link on that level must
     // have pointed at n and ended exactly at n's starting offset.
     for (i = 0; i < n->height; i++) {
       assert(iter.s[i].node == n);
       assert(iter.s[i].skip_size == num_chars);
       iter.s[i].node = n->nexts[i].node;
       iter.s[i].skip_size += n->nexts[i].skip_size;
 #if ROPE_WCHAR
       assert(iter.s[i].wchar_size == num_wchar);
       iter.s[i].wchar_size += n->nexts[i].wchar_size;
 #endif
     }

     num_bytes += n->num_bytes;
     num_chars += n->nexts[0].skip_size;
 #if ROPE_WCHAR
     num_wchar += n->nexts[0].wchar_size;
 #endif
   }

   // Every level must end at NULL having covered the whole rope.
   for (i = 0; i < r->head.height; i++) {
     assert(iter.s[i].node == NULL);
     assert(iter.s[i].skip_size == num_chars);
 #if ROPE_WCHAR
     assert(iter.s[i].wchar_size == num_wchar);
 #endif
   }

   assert(r->num_bytes == num_bytes);
   assert(r->num_chars == num_chars);
 #if ROPE_WCHAR
   assert(skip_over.wchar_size == num_wchar);
 #endif
 }

 // For debugging.
 #include <stdio.h>
 // Debugging aid: dump the rope's totals, the head's skip sizes, and then one
 // line per node (head included) with its skip sizes and raw string bytes.
 void _rope_print(rope *r) {
   int i;
   rope_node *n;

   // size_t values are printed with %zu (%zd is for the signed counterpart).
   printf("chars: %zu\tbytes: %zu\theight: %d\n", r->num_chars, r->num_bytes, r->head.height);

   printf("HEAD");
   for (i = 0; i < r->head.height; i++) {
     printf(" |%3zu ", r->head.nexts[i].skip_size);
   }
   printf("\n");

   int num = 0;
   for (n = &r->head; n != NULL; n = n->nexts[0].node) {
     printf("%3d:", num++);
     for ( i = 0; i < n->height; i++) {
       printf(" |%3zu ", n->nexts[i].skip_size);
     }
     printf("        : \"");
     // Node data is not NUL-terminated, so write exactly num_bytes bytes.
     fwrite(n->str, n->num_bytes, 1, stdout);
     printf("\"\n");
   }
 }
diff --git a/rope.h b/rope.h
 /* UTF-8 Rope implementation by Joseph Gentle
 *
 * This library implements a heavyweight utf8 string type with fast
 * insert-at-position and delete-at-position operations.
 * 
 * It uses skip lists instead of trees. Trees might be faster - who knows?
 *
 * Ropes are NOT THREAD SAFE. Do not call multiple rope methods
 * simultaneously from different threads.
 */

 #ifndef librope_rope_h
 #define librope_rope_h

 #include <stdint.h>
 #include <stddef.h>

 // Whether or not the rope should support converting UTF-8 character offsets to wchar array
 // positions. This is useful when interoperating with strings in JS, Objective-C and many other
 // languages. See http://josephg.com/post/31707645955/string-length-lies
 //
 // Adding wchar conversion support decreases performance by about 30%.
 #ifndef ROPE_WCHAR
 #define ROPE_WCHAR 0
 #endif

 // These two magic values seem to be approximately optimal given the benchmark in
 // tests.c which does lots of small inserts.

 // Must be <= UINT16_MAX. Benchmarking says this is pretty close to optimal
 // (tested on a mac using clang 4.0 and x86_64).
 #ifndef ROPE_NODE_STR_SIZE
 #if ROPE_WCHAR
 #define ROPE_NODE_STR_SIZE 64
 #else
 #define ROPE_NODE_STR_SIZE 136
 #endif
 #endif

 // The likelihood (%) a node will have height (n+1) instead of n
 #ifndef ROPE_BIAS
 #define ROPE_BIAS 25
 #endif

 // The rope will stop being efficient after the string is 2 ^ ROPE_MAX_HEIGHT nodes.
 #ifndef ROPE_MAX_HEIGHT
 #define ROPE_MAX_HEIGHT 60
 #endif

 struct rope_node_t;

 // One link of a node's skip list: a pointer to a later node plus the distance
 // to it. For a node, the number of characters in its str can be read out of
 // nexts[0].skip_size.
 typedef struct {
   // The number of _characters_ between the start of the current node
   // and the start of next.
   size_t skip_size;

   // For some reason, librope runs about 1% faster when this next pointer is
   // exactly _here_ in the struct.
   struct rope_node_t *node;

 #if ROPE_WCHAR
   // The number of wide characters spanned by this link (the wchar
   // counterpart of skip_size).
   size_t wchar_size;
 #endif
 } rope_skip_node;

 // A single node of the rope: a fixed-size chunk of UTF-8 bytes followed by a
 // variable number of skip links.
 typedef struct rope_node_t {
   // The node's UTF-8 data. It is not NUL-terminated; num_bytes gives the
   // used length.
   uint8_t str[ROPE_NODE_STR_SIZE];

   // The number of bytes in str in use
   uint16_t num_bytes;

   // This is the number of elements allocated in nexts.
   // The minimum height is 1. Each additional level is added with a
   // probability of ROPE_BIAS percent.
   uint8_t height;

   // Flexible array member with one link per level.
   rope_skip_node nexts[];
 } rope_node;

 // The rope itself: cached totals, the allocator callbacks, and the head node
 // of the skip list.
 typedef struct {
   // The total number of characters in the rope.
   size_t num_chars;

   // The total number of bytes which the characters in the rope take up.
   size_t num_bytes;

   // Allocator callbacks supplied to rope_new2() (rope_new() passes
   // malloc, realloc and free).
   void *(*alloc)(size_t bytes);
   void *(*realloc)(void *ptr, size_t newsize);
   void (*free)(void *ptr);

   // The first node exists inline in the rope structure itself.
   // It must stay the last member: it ends in a flexible array, and the rope
   // is allocated with extra room for the head's links.
   rope_node head;
 } rope;

 #ifdef __cplusplus
 extern "C" {
 #endif
  
 // Create a new rope with no contents, using malloc/realloc/free.
 rope *rope_new();

 // Create a new rope using custom allocators. The three callbacks are stored
 // in the rope and used for its allocations.
 rope *rope_new2(void *(*alloc)(size_t bytes),
     void *(*realloc)(void *ptr, size_t newsize),
     void (*free)(void *ptr));

 // Create a new rope containing a copy of the given string. Shorthand for
 // r = rope_new(); rope_insert(r, 0, str);
 rope *rope_new_with_utf8(const uint8_t *str);

 // Make a copy of an existing rope. The copy uses the same allocator
 // callbacks as r.
 rope *rope_copy(const rope *r);

 // Free the specified rope, including all of its nodes.
 void rope_free(rope *r);

 // Get the number of characters in a rope
 size_t rope_char_count(rope *r);

 // Get the number of bytes which the rope would take up if stored as a utf8
 // string (not counting a trailing '\0').
 size_t rope_byte_count(rope *r);

 // Copies the rope's contents into a utf8 encoded C string. Also copies a trailing '\0' character.
 // dest must therefore have room for rope_byte_count(r) + 1 bytes.
 // Returns the number of bytes written, which is rope_byte_count(r) + 1.
 size_t rope_write_cstr(rope *r, uint8_t *dest);

 // Create a new C string which contains the rope. The string will contain
 // the rope encoded as utf8, followed by a trailing '\0'.
 // Use rope_byte_count(r) to get the length of the returned string.
 // The buffer comes from the rope's alloc callback.
 uint8_t *rope_create_cstr(rope *r);

 // Insert the given utf8 string into the rope at the specified position.
 // pos is measured in characters; a pos past the end is treated as the end.
 void rope_insert(rope *r, size_t pos, const uint8_t *str);

 // Delete num characters at position pos. Deleting past the end of the string
 // has no effect.
 void rope_del(rope *r, size_t pos, size_t num);
  
 // This macro expands to a for() loop header which loops over the segments in a rope.
 // Iteration starts at the rope's head node and follows the level-0 links.
 // A node's data is not NUL-terminated, so use its byte count when printing.
 //
 // Eg:
 //  rope *r = rope_new_with_utf8(str);
 //  ROPE_FOREACH(r, iter) {
 //    fwrite(rope_node_data(iter), 1, rope_node_num_bytes(iter), stdout);
 //  }
 #define ROPE_FOREACH(rope, iter) \
   for (rope_node *iter = &(rope)->head; iter != NULL; iter = iter->nexts[0].node)

 // Return a pointer to the first byte of the node's string data.
 static inline uint8_t *rope_node_data(rope_node *n) {
   uint8_t *data = &n->str[0];
   return data;
 }

 // Return how many bytes of the node's string data are in use. Handy when
 // walking a rope node by node.
 static inline size_t rope_node_num_bytes(rope_node *n) {
   size_t used = n->num_bytes;
   return used;
 }

 // Return how many characters the node holds, read from its level-0 link.
 static inline size_t rope_node_chars(rope_node *n) {
   const rope_skip_node *first = &n->nexts[0];
   return first->skip_size;
 }
  
 #if ROPE_WCHAR
 // Get the number of wchar characters in the rope
 size_t rope_wchar_count(rope *r);

 // Insert the given utf8 string into the rope at the specified wchar position. This is compatible
 // with NSString, Javascript, etc. The string still needs to be passed in using UTF-8.
 // A wchar_pos past the end is treated as the end.
 //
 // Returns the insertion position in characters.
 size_t rope_insert_at_wchar(rope *r, size_t wchar_pos, const uint8_t *utf8_str);

 // Delete wchar_num wide characters at the specified wchar position offset.
 // Returns the deletion position in characters. If char_len_out is not null,
 // *char_len_out is set to the deletion length in characters.
 // If either end of the range falls inside a character, behaviour is undefined.
 size_t rope_del_at_wchar(rope *r, size_t wchar_pos, size_t wchar_num, size_t *char_len_out);
  
 // Return how many wchars the node holds, read from its level-0 link. Handy
 // when walking a rope node by node.
 static inline size_t rope_node_wchars(rope_node *n) {
   const rope_skip_node *first = &n->nexts[0];
   return first->wchar_size;
 }
 #endif


  
 // For debugging.
 // _rope_check asserts that the rope's internal bookkeeping is consistent;
 // _rope_print dumps the rope's structure and contents to stdout.
 void _rope_check(rope *r);
 void _rope_print(rope *r);

 #ifdef __cplusplus
 }
 #endif

 #endif
	// https://github.com/josephg/librope

	#include <stdlib.h>
	#include <stdio.h>

	#include "rope.h"

	// Render the rope into a freshly allocated C string, print it on its own
	// line, and release the buffer. Returns 0 on success, -1 if allocation fails.
	static int
	print_rope(rope *r)
	{
	    // rope_write_cstr() writes rope_byte_count(r) bytes followed by a
	    // terminating '\0', so the buffer needs one extra byte.
	    uint8_t *str = malloc(rope_byte_count(r) + 1);

	    if (str == NULL) {
	        fprintf(stderr, "out of memory\n");
	        return -1;
	    }

	    rope_write_cstr(r, str);
	    printf("%s\n", (const char *)str);
	    free(str);

	    return 0;
	}

	// Demo driver: builds a rope, deletes from it, inserts into it again, and
	// prints the contents after each step.
	int
	main()
	{
	    int status = 0;
	    rope *r = rope_new();

	    rope_insert(r, 0, (const uint8_t *)"Hello, World!");
	    if (print_rope(r) != 0)
	        status = 1;

	    rope_del(r, 5, 7);
	    if (print_rope(r) != 0)
	        status = 1;

	    rope_insert(r, 5, (const uint8_t *)", Pootrick");
	    if (print_rope(r) != 0)
	        status = 1;

	    rope_free(r);

	    return status;
	}
	# Flags applied to every compile step: debug info plus the common warning sets.
	CFLAGS = -g -Wall -Wextra

	# None of these targets name a file that the rule produces.
	.PHONY: all rope clean

	# Build the demo binary. rope.o is rebuilt first through the rope target.
	all: rope
		gcc $(CFLAGS) -o main main.c rope.o

	# Compile the rope library into an object file.
	rope:
		gcc $(CFLAGS) -o rope.o -c rope.c

	# Remove all build products.
	clean:
		rm -rf main *.dSYM rope.o
	/* UTF-8 Rope implementation by Joseph Gentle
	*
	* This library implements a heavyweight utf8 string type with fast
	* insert-at-position and delete-at-position operations.
	*
	* It uses skip lists instead of trees. Trees might be faster - who knows?
	*
	* Ropes are NOT THREAD SAFE. Do not call multiple rope methods
	* simultaneously from different threads.
	*/

	#ifndef librope_rope_h
	#define librope_rope_h

	#include <stdint.h>
	#include <stddef.h>

	// Whether or not the rope should support converting UTF-8 character offsets to wchar array
	// positions. This is useful when interoperating with strings in JS, Objective-C and many other
	// languages. See http://josephg.com/post/31707645955/string-length-lies
	//
	// Adding wchar conversion support decreases performance by about 30%.
	//
	// Defaults to 0 (disabled). Because of the #ifndef guard, a definition made
	// before this header is included (e.g. -DROPE_WCHAR=1) takes precedence.
	#ifndef ROPE_WCHAR
	#define ROPE_WCHAR 0
	#endif

	// These two magic values seem to be approximately optimal given the benchmark in
	// tests.c which does lots of small inserts.
	// NOTE(review): "these two" presumably refers to ROPE_NODE_STR_SIZE and
	// ROPE_BIAS - confirm.

	// ROPE_NODE_STR_SIZE is the size, in bytes, of the str buffer inside each rope_node.
	// Must be <= UINT16_MAX (rope_node tracks the bytes in use in a uint16_t).
	// Benchmarking says this is pretty close to optimal
	// (tested on a mac using clang 4.0 and x86_64).
	// Defaults to 64 when ROPE_WCHAR is enabled and 136 otherwise; define it
	// before including this header to override.
	#ifndef ROPE_NODE_STR_SIZE
	#if ROPE_WCHAR
	#define ROPE_NODE_STR_SIZE 64
	#else
	#define ROPE_NODE_STR_SIZE 136
	#endif
	#endif

	// The likelihood (%) a node will have height (n+1) instead of n.
	// Expressed as a percentage; defaults to 25 and can be overridden by
	// defining ROPE_BIAS before including this header.
	#ifndef ROPE_BIAS
	#define ROPE_BIAS 25
	#endif

	// The rope will stop being efficient after the string is 2 ^ ROPE_MAX_HEIGHT nodes.
	// Defaults to 60; define ROPE_MAX_HEIGHT before including this header to override.
	// NOTE(review): rope_node stores its height in a uint8_t, so values above
	// 255 presumably cannot be represented - confirm before raising this.
	#ifndef ROPE_MAX_HEIGHT
	#define ROPE_MAX_HEIGHT 60
	#endif

	struct rope_node_t;

	// One entry of a node's nexts[] array: a pointer to a following node together
	// with the distance to it.
	//
	// The number of characters in a node's str can be read out of that node's
	// nexts[0].skip_size.
	typedef struct {
	// The number of _characters_ between the start of the current node
	// and the start of next.
	size_t skip_size;

	// The node this entry points at.
	// For some reason, librope runs about 1% faster when this next pointer is
	// exactly _here_ in the struct.
	struct rope_node_t *node;

	#if ROPE_WCHAR
	// The number of wide characters contained in space.
	// NOTE(review): "space" presumably means the span this entry skips over -
	// confirm in rope.c. The field only exists when ROPE_WCHAR is non-zero.
	size_t wchar_size;
	#endif
	} rope_skip_node;

	// A single node of the rope: a fixed-size chunk of UTF-8 bytes followed by a
	// variable number of rope_skip_node links.
	typedef struct rope_node_t {
	// Storage for this node's bytes; only the first num_bytes are in use.
	uint8_t str[ROPE_NODE_STR_SIZE];

	// The number of bytes in str in use
	uint16_t num_bytes;

	// This is the number of elements allocated in nexts.
	// Each height is 1/2 as likely as the height before. The minimum height is 1.
	// NOTE(review): ROPE_BIAS defaults to 25 (%), which suggests 1/4 rather
	// than 1/2 - confirm against rope.c.
	uint8_t height;

	// Flexible array member: `height` links are allocated after the struct.
	rope_skip_node nexts[];
	} rope_node;

	// The rope itself: whole-string totals, the allocator callbacks the rope was
	// created with, and the first node stored inline.
	typedef struct {
	  // The total number of characters in the rope.
	  size_t num_chars;

	  // The total number of bytes which the characters in the rope take up.
	  size_t num_bytes;

	  // Allocator callbacks, as passed to rope_new2(). They are function
	  // pointers with the same signatures as malloc, realloc and free.
	  void *(*alloc)(size_t bytes);
	  void *(*realloc)(void *ptr, size_t newsize);
	  void (*free)(void *ptr);

	  // The first node exists inline in the rope structure itself.
	  rope_node head;
	} rope;

	#ifdef __cplusplus
	extern "C" {
	#endif

	// Create a new rope with no contents.
	// Declared with (void) so that C compilers treat this as a real prototype
	// and reject calls that pass arguments.
	rope *rope_new(void);

	// Create a new rope using custom allocators.
	//   alloc   - malloc-style allocation function
	//   realloc - realloc-style resize function
	//   free    - free-style release function
	// The three callbacks are stored in the returned rope.
	rope *rope_new2(void *(*alloc)(size_t bytes),
	                void *(*realloc)(void *ptr, size_t newsize),
	                void (*free)(void *ptr));

	// Create a new rope containing a copy of the given string. Shorthand for
	// r = rope_new(); rope_insert(r, 0, str);
	// str is a UTF-8 encoded string; no length is passed, so it is expected to
	// be '\0'-terminated.
	rope *rope_new_with_utf8(const uint8_t *str);

	// Make a copy of an existing rope. The source rope is taken by const
	// pointer and returned as a new rope pointer.
	// NOTE(review): presumably the copy must be released with rope_free() -
	// confirm in rope.c.
	rope *rope_copy(const rope *r);

	// Free the specified rope.
	// NOTE(review): presumably r must not be used after this call - confirm
	// in rope.c.
	void rope_free(rope *r);

	// Get the number of characters in a rope.
	// This is a count of characters, not bytes; use rope_byte_count() for the
	// UTF-8 byte length.
	size_t rope_char_count(rope *r);

	// Get the number of bytes which the rope would take up if stored as a utf8
	// string.
	// The count does not include a terminating '\0': rope_write_cstr() writes
	// rope_byte_count(r) + 1 bytes, so a buffer passed to it needs one extra byte.
	size_t rope_byte_count(rope *r);

	// Copies the rope's contents into a utf8 encoded C string. Also copies a trailing '\0' character.
	// dest must therefore have room for at least rope_byte_count(r) + 1 bytes.
	// Returns the number of bytes written, which is rope_byte_count(r) + 1.
	size_t rope_write_cstr(rope *r, uint8_t *dest);

	// Create a new C string which contains the rope. The string will contain
	// the rope encoded as utf8, followed by a trailing '\0'.
	// Use rope_byte_count(r) to get the length of the returned string.
	// NOTE(review): who owns the returned buffer, and which allocator releases
	// it, is not visible from this header - confirm in rope.c.
	uint8_t *rope_create_cstr(rope *r);

	// Insert the given utf8 string into the rope at the specified position.
	// str carries no length argument, so it is expected to be '\0'-terminated.
	// NOTE(review): pos is presumably a character offset (not a byte offset) -
	// confirm in rope.c.
	void rope_insert(rope *r, size_t pos, const uint8_t *str);

	// Delete num characters at position pos. Deleting past the end of the string
	// has no effect.
	// num is a count of characters.
	// NOTE(review): pos is presumably a character offset as well - confirm in
	// rope.c.
	void rope_del(rope *r, size_t pos, size_t num);

	// This macro expands to a for() loop header which loops over the segments in a rope.
	//
	//   rope - pointer to the rope to walk
	//   iter - name of the rope_node pointer variable the macro declares
	//
	// Iteration starts at the rope's inline head node and follows nexts[0].node
	// until it is NULL. The loop variable is declared inside the for() header.
	//
	// Eg:
	//   rope *r = rope_new_with_utf8(str);
	//   ROPE_FOREACH(r, iter) {
	//     printf("%s", rope_node_data(iter));
	//   }
	// NOTE(review): a node's str is a fixed-size buffer with num_bytes bytes in
	// use; the "%s" in the example assumes it is '\0'-terminated - confirm, or
	// bound the output with rope_node_num_bytes(iter).
	#define ROPE_FOREACH(rope, iter) \
	for (rope_node *iter = &(rope)->head; iter != NULL; iter = iter->nexts[0].node)

	// Get the actual data inside a rope node: a pointer to the node's str buffer.
	// Only the first rope_node_num_bytes(n) bytes of the buffer are in use.
	// NOTE(review): the buffer does not appear to be '\0'-terminated - confirm
	// in rope.c before treating it as a C string.
	static inline uint8_t *rope_node_data(rope_node *n) {
	  return n->str;
	}

	// Report how many bytes of a node's str buffer are in use. Handy when
	// walking a rope node by node.
	static inline size_t rope_node_num_bytes(rope_node *n) {
	  const size_t used_bytes = n->num_bytes;
	  return used_bytes;
	}

	// Report how many characters a single rope node holds, as recorded in its
	// nexts[0].skip_size field.
	static inline size_t rope_node_chars(rope_node *n) {
	  const size_t char_count = n->nexts[0].skip_size;
	  return char_count;
	}

	#if ROPE_WCHAR
	// Get the number of wchar characters in the rope.
	// Only declared when ROPE_WCHAR is non-zero.
	size_t rope_wchar_count(rope *r);

	// Insert the given utf8 string into the rope at the specified wchar position. This is compatible
	// with NSString, Javascript, etc. The string still needs to be passed in using UTF-8.
	// utf8_str carries no length argument, so it is expected to be '\0'-terminated.
	//
	// Returns the insertion position in characters.
	size_t rope_insert_at_wchar(rope *r, size_t wchar_pos, const uint8_t *utf8_str);

	// Delete wchar_num wide characters at the specified wchar position offset.
	// Returns the deletion position in characters. If char_len_out is not NULL,
	// *char_len_out is set to the deletion length, in characters.
	// If the range is inside character boundaries, behaviour is undefined.
	size_t rope_del_at_wchar(rope *r, size_t wchar_pos, size_t wchar_num, size_t *char_len_out);

	// Report how many wchars a single rope node holds, as recorded in its
	// nexts[0].wchar_size field. Handy when walking a rope node by node.
	static inline size_t rope_node_wchars(rope_node *n) {
	  const size_t wide_count = n->nexts[0].wchar_size;
	  return wide_count;
	}
	#endif



	// For debugging. Both helpers take the rope to inspect and return nothing;
	// their behaviour is defined in rope.c and is not visible from this header.
	// NOTE(review): file-scope identifiers that begin with an underscore are
	// reserved in C. They are kept as-is because renaming would change the
	// public interface.
	void _rope_check(rope *r);
	void _rope_print(rope *r);

	#ifdef __cplusplus
	}
	#endif

	#endif