added ternary trie implementation
							parent
							
								
									d7f95f0fbf
								
							
						
					
					
						commit
						0b97f124c5
					
				| 
						 | 
					@ -1,10 +1,15 @@
 | 
				
			||||||
cmake_minimum_required(VERSION 3.24)
 | 
					cmake_minimum_required(VERSION 3.20)
 | 
				
			||||||
project(lander C CXX)
 | 
					project(lander C CXX)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
set(CMAKE_C_STANDARD 17)
 | 
					set(CMAKE_C_STANDARD 17)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
add_subdirectory(crow)
 | 
					add_subdirectory(crow)
 | 
				
			||||||
include_directories(crow/include)
 | 
					add_subdirectory(tries)
 | 
				
			||||||
 | 
					include_directories(crow/include tries/include)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					if(CMAKE_BUILD_TYPE STREQUAL Release)
 | 
				
			||||||
 | 
					    add_compile_options(-O3 -flto)
 | 
				
			||||||
 | 
					endif()
 | 
				
			||||||
 | 
					
 | 
				
			||||||
add_executable(lander src/main.cpp)
 | 
					add_executable(lander src/main.cpp)
 | 
				
			||||||
target_link_libraries(lander PUBLIC Crow)
 | 
					target_link_libraries(lander PUBLIC Crow ternarytrie)
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										9
									
								
								Makefile
								
								
								
								
							
							
						
						
									
										9
									
								
								Makefile
								
								
								
								
							| 
						 | 
					@ -20,6 +20,15 @@ $(BUILD_DIR)/Debug/Makefile: CMakeLists.txt
 | 
				
			||||||
build: cmake
 | 
					build: cmake
 | 
				
			||||||
	@ make -C '$(BUILD_DIR)/Debug'
 | 
						@ make -C '$(BUILD_DIR)/Debug'
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					.PHONY: cmake-release
 | 
				
			||||||
 | 
					cmake-release: $(BUILD_DIR)/Release/Makefile
 | 
				
			||||||
 | 
					$(BUILD_DIR)/Release/Makefile: CMakeLists.txt
 | 
				
			||||||
 | 
						@ cmake -B'$(BUILD_DIR)/Release' -DCMAKE_BUILD_TYPE=Release .
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					.PHONY: prod
 | 
				
			||||||
 | 
					prod: cmake-release
 | 
				
			||||||
 | 
						@ make -C '$(BUILD_DIR)/Release'
 | 
				
			||||||
 | 
					
 | 
				
			||||||
.PHONY: run
 | 
					.PHONY: run
 | 
				
			||||||
run: build
 | 
					run: build
 | 
				
			||||||
	@ ./build/Debug/lander
 | 
						@ ./build/Debug/lander
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,8 @@
 | 
				
			||||||
 | 
					cmake_minimum_required(VERSION 3.20)
 | 
				
			||||||
 | 
					project(AD3-project-2022-2023 C)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					set(CMAKE_C_STANDARD 17)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					include_directories(include)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					add_library(ternarytrie STATIC include/ternarytrie.h src/ternarytrie.c)
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,72 @@
 | 
				
			||||||
 | 
					#ifndef AD3_TERNARYTRIE
					#define AD3_TERNARYTRIE

					/**
					 * Public interface of the Ternary Trie.
					 *
					 * Each node should be represented by a binary tree in order to reduce the
					 * memory usage.
					 */

					#include <stdbool.h>
					#include <stddef.h>

					/* Give the functions C linkage when this header is included from C++. */
					#ifdef __cplusplus
					extern "C" {
					#endif

					/**
					 * Opaque type representing a Trie.
					 *
					 * The concrete fields are defined in the implementation file; users of this
					 * header only ever handle pointers to it.
					 */
					typedef struct ttrie TernaryTrie;

					/**
					 * Allocate and initialize an empty Trie.
					 *
					 * @return a pointer to an empty Trie struct
					 */
					TernaryTrie *ternarytrie_init(void);

					/**
					 * De-allocate a trie by freeing the memory occupied by this trie.
					 *
					 * @param trie which should be freed
					 */
					void ternarytrie_free(TernaryTrie *trie);

					/**
					 * Search whether a string is contained in this trie.
					 *
					 * @param trie trie to look in
					 * @param string string to look up
					 * @return true if the string is contained within this trie, false otherwise
					 */
					bool ternarytrie_search(TernaryTrie *trie, const char *string);

					/**
					 * Add a string to this trie.
					 *
					 * @param trie trie to add the string to
					 * @param string string to add
					 * @return true if the trie was changed by this operation, false if the string
					 * was already present
					 */
					bool ternarytrie_add(TernaryTrie *trie, const char *string);

					/**
					 * Remove a string from this trie.
					 *
					 * Note: strings added to this trie are considered to be "owned" by the caller.
					 * Removing the string from the trie should not free the string's memory.
					 *
					 * @param trie trie to remove the string from
					 * @param string string to remove
					 * @return true if the string was present and has been removed, false if it was
					 * not present
					 */
					bool ternarytrie_remove(TernaryTrie *trie, const char *string);

					/**
					 * Returns the number of strings in this trie.
					 *
					 * @param trie trie to query
					 * @return the number of strings in this trie
					 */
					size_t ternarytrie_size(TernaryTrie *trie);

					#ifdef __cplusplus
					}
					#endif

					#endif // AD3_TERNARYTRIE
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,42 @@
 | 
				
			||||||
 | 
					// NOTE(review): ALPHABET_SIZE and MAX are not referenced by the code visible in
					// this file; they are kept in case other files that include it rely on them.
					#define ALPHABET_SIZE 256
					// Character that terminates every string handled by the trie.
					#define DELIMITER '\0'
					// Caution: evaluates each argument more than once.
					#define MAX(x, y) (((x) > (y)) ? (x) : (y))

					#include <stdlib.h>
					#include <string.h>

					/**
					 * Own implementation of strdup, heavily inspired by the glibc source code.
					 *
					 * This is necessary because subGIT does not seem to have a strdup
					 * implementation available for use.
					 *
					 * @param s string to duplicate; must be terminated by DELIMITER
					 * @return pointer to the newly allocated copy, which the caller must free, or
					 * NULL if the allocation failed
					 */
					char *my_strdup(const char *s) {
					  size_t len = strlen(s);
					  char *copy = malloc(len + 1);

					  if (copy == NULL) {
					    return NULL;
					  }

					  memcpy(copy, s, len);
					  copy[len] = DELIMITER;

					  return copy;
					}

					/**
					 * Own implementation of strndup, heavily inspired by the glibc source code.
					 *
					 * This is necessary because subGIT does not seem to have a strndup
					 * implementation available for use.
					 *
					 * At most n characters of s are copied; the copy is always terminated.
					 *
					 * @param s string to duplicate
					 * @param n maximum number of characters to copy from s
					 * @return pointer to the newly allocated copy, which the caller must free, or
					 * NULL if the allocation failed
					 */
					char *my_strndup(const char *s, size_t n) {
					  // Look for the terminator within the first n bytes only, so that s is never
					  // read beyond n characters even if it isn't terminated within that range.
					  const char *end = memchr(s, DELIMITER, n);
					  size_t len = (end != NULL) ? (size_t)(end - s) : n;
					  char *copy = malloc(len + 1);

					  if (copy == NULL) {
					    return NULL;
					  }

					  memcpy(copy, s, len);
					  copy[len] = DELIMITER;

					  return copy;
					}
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,247 @@
 | 
				
			||||||
 | 
					#include "ternarytrie.h"
 | 
				
			||||||
 | 
					#include "ternarytrie_node.c"
 | 
				
			||||||
 | 
					#include <stdint.h>
 | 
				
			||||||
 | 
					#include <stdlib.h>
 | 
				
			||||||
 | 
					#include <string.h>
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					typedef struct ttrie {
 | 
				
			||||||
 | 
					  TernaryTrieNode *root;
 | 
				
			||||||
 | 
					  size_t size;
 | 
				
			||||||
 | 
					} TernaryTrie;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Allocate and initialize an empty TernaryTrie
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @return pointer to the empty TernaryTrie
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline TernaryTrie *ternarytrie_init() {
 | 
				
			||||||
 | 
					  TernaryTrie *node = calloc(1, sizeof(TernaryTrie));
 | 
				
			||||||
 | 
					  node->root = ttnode_init();
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return node;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * De-allocate a TernaryTree by freeing its entire underlying structure.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param trie trie to free
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline void ternarytrie_free(TernaryTrie *trie) {
 | 
				
			||||||
 | 
					  ttnode_free(trie->root);
 | 
				
			||||||
 | 
					  free(trie);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					typedef struct searchresult {
 | 
				
			||||||
 | 
					  TernaryTrieNode *parent;
 | 
				
			||||||
 | 
					  TernaryTrieNode *child;
 | 
				
			||||||
 | 
					} SearchResult;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
					 * Look up the node representing the given string, along with the node that
					 * links to it.
					 *
					 * @param trie trie to look in
					 * @param string string to look up
					 * @return result whose child is the node representing the string, or NULL if
					 * the string isn't in the trie. The parent is left NULL when the string is
					 * the empty string, as that one is represented by the root itself.
					 */
					SearchResult ternarytrie_search_node(TernaryTrie *trie, const char *string) {
					  SearchResult result = {NULL, NULL};

					  // The empty string is represented by the root node itself
					  if (string[0] == DELIMITER) {
					    if (trie->root->type == 1) {
					      result.child = trie->root;
					    }

					    return result;
					  }

					  TernaryTrieNode *owner = trie->root;
					  TernaryTrieNode *found;
					  size_t pos = 0;

					  for (;;) {
					    TernaryTrieNode **slot = ttnode_search(owner, string[pos], false);

					    // Either the character isn't in owner's binary tree, or it has no node
					    // attached to it
					    if (slot == NULL || *slot == NULL) {
					      return result;
					    }

					    found = *slot;
					    pos++;

					    // Stop once the string is used up, or once a full leaf is reached, as
					    // that one can't be descended into any further
					    if (string[pos] == DELIMITER || found->type == 2) {
					      break;
					    }

					    owner = found;
					  }

					  bool matches;

					  if (found->type == 2) {
					    // A full leaf only matches if the unvisited part of the string is exactly
					    // the suffix it stores
					    matches = string[pos] != DELIMITER &&
					              strcmp(string + pos, found->ptr.string) == 0;
					  } else {
					    // The entire string has been traversed, so the node has to be marked as
					    // representing a string
					    matches = found->type == 1;
					  }

					  if (matches) {
					    result.child = found;
					    result.parent = owner;
					  }

					  return result;
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Returns whether the given string is present in the trie.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param trie trie to look in
 | 
				
			||||||
 | 
					 * @param string string to look up
 | 
				
			||||||
 | 
					 * @return true if the string is present in the trie, false otherwise
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline bool ternarytrie_search(TernaryTrie *trie, const char *string) {
 | 
				
			||||||
 | 
					  SearchResult res = ternarytrie_search_node(trie, string);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return res.child != NULL;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Add the given string to the TernaryTrie.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param trie trie to add string to
 | 
				
			||||||
 | 
					 * @param string string to add
 | 
				
			||||||
 | 
					 * @return true if the string wasn't present in the trie and thus added, false
 | 
				
			||||||
 | 
					 * otherwise
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					bool ternarytrie_add(TernaryTrie *trie, const char *string) {
 | 
				
			||||||
 | 
					  // Edge case for empty string
 | 
				
			||||||
 | 
					  if (string[0] == DELIMITER) {
 | 
				
			||||||
 | 
					    if (trie->root->type == 0) {
 | 
				
			||||||
 | 
					      trie->root->type = 1;
 | 
				
			||||||
 | 
					      trie->size++;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      return true;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    return false;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  size_t i = 0;
 | 
				
			||||||
 | 
					  TernaryTrieNode **node_ptr = &(trie->root);
 | 
				
			||||||
 | 
					  TernaryTrieNode **new_node_ptr;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  do {
 | 
				
			||||||
 | 
					    new_node_ptr = ttnode_search(*node_ptr, string[i], true);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    // ttnode_search will only return NULL with create true if the node to look
 | 
				
			||||||
 | 
					    // in represents a full leaf. Therefore, we split the node and restart the
 | 
				
			||||||
 | 
					    // iteration.
 | 
				
			||||||
 | 
					    if (new_node_ptr == NULL) {
 | 
				
			||||||
 | 
					      // It's possible we've ended up in the full leaf node that represents this
 | 
				
			||||||
 | 
					      // string
 | 
				
			||||||
 | 
					      if (strcmp(string + i, (*node_ptr)->ptr.string) == 0) {
 | 
				
			||||||
 | 
					        return false;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      ttnode_split(*node_ptr);
 | 
				
			||||||
 | 
					      continue;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    node_ptr = new_node_ptr;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    // The search function has added the character to the node
 | 
				
			||||||
 | 
					    i++;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    // The next node in the string's path doesn't exist yet, so we add it to the
 | 
				
			||||||
 | 
					    // trie
 | 
				
			||||||
 | 
					    if (*node_ptr == NULL) {
 | 
				
			||||||
 | 
					      TernaryTrieNode *new_node = ttnode_init();
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      // If there's a remaining part of the string, we add it to the leaf
 | 
				
			||||||
 | 
					      if (string[i] != DELIMITER) {
 | 
				
			||||||
 | 
					        ttnode_set_string(new_node, string + i);
 | 
				
			||||||
 | 
					      } else {
 | 
				
			||||||
 | 
					        new_node->type = 1;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      *node_ptr = new_node;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      trie->size++;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      return true;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					  } while (string[i] != DELIMITER);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // If we've arrived here, we've traversed through the entire string and have
 | 
				
			||||||
 | 
					  // arrived at a node that already exists.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // The existing node is a full leaf, so we split it and make it
 | 
				
			||||||
 | 
					  // represent our new string.
 | 
				
			||||||
 | 
					  if ((*node_ptr)->type == 2) {
 | 
				
			||||||
 | 
					    ttnode_split(*node_ptr);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  // The string is already in the trie
 | 
				
			||||||
 | 
					  else if ((*node_ptr)->type == 1) {
 | 
				
			||||||
 | 
					    return false;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  (*node_ptr)->type = 1;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  trie->size++;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return true;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Remove the given string from a TernaryTrie.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param trie trie to remove string from
 | 
				
			||||||
 | 
					 * @param string string to remove
 | 
				
			||||||
 | 
					 * @return true if the string was in the trie and thus removed, false otherwise
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					bool ternarytrie_remove(TernaryTrie *trie, const char *string) {
 | 
				
			||||||
 | 
					  SearchResult res = ternarytrie_search_node(trie, string);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if (res.child == NULL) {
 | 
				
			||||||
 | 
					    return false;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  trie->size--;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if (res.parent != NULL) {
 | 
				
			||||||
 | 
					    // We're removing a full leaf, so we calculate the offset of the character
 | 
				
			||||||
 | 
					    // to remove from the parent
 | 
				
			||||||
 | 
					    if (res.child->type == 2) {
 | 
				
			||||||
 | 
					      size_t str_len = strlen(string);
 | 
				
			||||||
 | 
					      size_t suffix_len = strlen(res.child->ptr.string);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      ttnode_remove(res.parent, string[str_len - suffix_len - 1]);
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    // In the other case, the character to remove from the parent is the last
 | 
				
			||||||
 | 
					    // character of the string
 | 
				
			||||||
 | 
					    else if (res.child->size == 0) {
 | 
				
			||||||
 | 
					      size_t i = 0;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      while (string[i + 1] != DELIMITER) {
 | 
				
			||||||
 | 
					        i++;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      ttnode_remove(res.parent, string[i]);
 | 
				
			||||||
 | 
					    } else {
 | 
				
			||||||
 | 
					      res.child->type = 0;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      return true;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    ttnode_free(res.child);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  // We're in the root here
 | 
				
			||||||
 | 
					  else {
 | 
				
			||||||
 | 
					    res.child->type = 0;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return true;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Return the current size of the given trie.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param trie trie to return size for
 | 
				
			||||||
 | 
					 * @return size of the trie
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline size_t ternarytrie_size(TernaryTrie *trie) { return trie->size; }
 | 
				
			||||||
| 
						 | 
					@ -0,0 +1,312 @@
 | 
				
			||||||
 | 
					#include "common.c"
 | 
				
			||||||
 | 
					#include <stdbool.h>
 | 
				
			||||||
 | 
					#include <stdint.h>
 | 
				
			||||||
 | 
					#include <stdlib.h>
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
					 * A single node of the binary tree stored inside each non-leaf
					 * TernaryTrieNode. The tree is ordered by key.
					 */
					struct ttinode {
					  // Subtree holding the keys smaller than this node's key
					  struct ttinode *left;
					  // Subtree holding the keys greater than this node's key
					  struct ttinode *right;
					  // Trie node reached by following this node's character; can be NULL
					  struct ttnode *next;
					  // Character this node stands for
					  char key;
					};

					typedef struct ttinode TernaryTrieInnerNode;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Represents a node inside a TernaryTrie. A node can be in one of three states:
 | 
				
			||||||
 | 
					 * - Internal node: a node that's part of a path to a leaf node. This node will
 | 
				
			||||||
 | 
					 *   always have a size greater than one, and an initialized root.
 | 
				
			||||||
 | 
					 * - Leaf: a node solely used to represent a string ending there. Its size is 0,
 | 
				
			||||||
 | 
					 *   its ptr is unitialized and represents is true.
 | 
				
			||||||
 | 
					 * - Full leaf: a leaf node that contains a string. This occurs when a string is
 | 
				
			||||||
 | 
					 *   added whose path is not fully in the tree yet, causing its remaining suffix
 | 
				
			||||||
 | 
					 *   to be stored as a single node. Its size will be zero, represents its true,
 | 
				
			||||||
 | 
					 *   and its string pointer is initialized.
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					typedef struct ttnode {
 | 
				
			||||||
 | 
					  union {
 | 
				
			||||||
 | 
					    TernaryTrieInnerNode *root;
 | 
				
			||||||
 | 
					    char *string;
 | 
				
			||||||
 | 
					  } ptr;
 | 
				
			||||||
 | 
					  // What type of node this is
 | 
				
			||||||
 | 
					  // 0: regular non-representing node
 | 
				
			||||||
 | 
					  // 1: regular representing node
 | 
				
			||||||
 | 
					  // 2: full leaf
 | 
				
			||||||
 | 
					  uint8_t type;
 | 
				
			||||||
 | 
					  // Dependent on type
 | 
				
			||||||
 | 
					  // 0, 1: size of underlying binary tree
 | 
				
			||||||
 | 
					  // 2: length of string
 | 
				
			||||||
 | 
					  uint8_t size;
 | 
				
			||||||
 | 
					} TernaryTrieNode;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// Required for recursively freeing tree structure
 | 
				
			||||||
 | 
					void ttnode_free(TernaryTrieNode *node);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Allocate and initialize a new TernaryTrieInnerNode representing a given
 | 
				
			||||||
 | 
					 * character.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param c character to represent
 | 
				
			||||||
 | 
					 * @return pointer to newly allocated struct
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline TernaryTrieInnerNode *ttinode_init(char c) {
 | 
				
			||||||
 | 
					  TernaryTrieInnerNode *node = calloc(1, sizeof(TernaryTrieInnerNode));
 | 
				
			||||||
 | 
					  node->key = c;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return node;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Allocate and initialize a new TernaryTrieNode.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @return pointer to newly allocated struct
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline TernaryTrieNode *ttnode_init() { return calloc(1, sizeof(TernaryTrieNode)); }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Free a TernaryTrieInnerNode and its underlying tree structure. This should
 | 
				
			||||||
 | 
					 * usually only be called on the root of a binary tree to free the entire
 | 
				
			||||||
 | 
					 * structure.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node whose tree to free
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					void ttinode_free_cascade(TernaryTrieInnerNode *node) {
 | 
				
			||||||
 | 
					  if (node->left != NULL) {
 | 
				
			||||||
 | 
					    ttinode_free_cascade(node->left);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if (node->right != NULL) {
 | 
				
			||||||
 | 
					    ttinode_free_cascade(node->right);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if (node->next != NULL) {
 | 
				
			||||||
 | 
					    ttnode_free(node->next);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  free(node);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Free a TernaryTrieNode and its underlying tree structure.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node to free
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					void ttnode_free(TernaryTrieNode *node) {
 | 
				
			||||||
 | 
					  if (node->type == 2) {
 | 
				
			||||||
 | 
					    free(node->ptr.string);
 | 
				
			||||||
 | 
					  } else if (node->size != 0) {
 | 
				
			||||||
 | 
					    ttinode_free_cascade(node->ptr.root);
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  free(node);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Add the string to the given node & set its type accordingely.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node to add string to
 | 
				
			||||||
 | 
					 * @param string string to add
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline void ttnode_set_string(TernaryTrieNode *node, const char *string) {
 | 
				
			||||||
 | 
					  node->type = 2;
 | 
				
			||||||
 | 
					  node->size = strlen(string);
 | 
				
			||||||
 | 
					  node->ptr.string = my_strdup(string);
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * This function performs a lookup in the underlying binary tree of the given
 | 
				
			||||||
 | 
					 * TernaryTrieNode. If found, the return value is a pointer to the memory
 | 
				
			||||||
 | 
					 * location where the TernaryTrieInnerNode representing the given character
 | 
				
			||||||
 | 
					 * stores its `next` field. If not found, the return value is NULL, unless
 | 
				
			||||||
 | 
					 * `create` is true.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * NOTE: a non-NULL return value does not mean that the dereferenced value is
 | 
				
			||||||
 | 
					 * also not NULL. In particular, if `create` is set to true and the function had
 | 
				
			||||||
 | 
					 * to create the new node, the dereferenced value will always be NULL.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node to perform lookup in. If node is a full leaf, the return
 | 
				
			||||||
 | 
					 * value will always be NULL, regardless of the value of create.
 | 
				
			||||||
 | 
					 * @param create whether to create the TernaryTrieInnerNode if it isn't present
 | 
				
			||||||
 | 
					 * yet. If this is set to true, the function will never return NULL unless the
 | 
				
			||||||
 | 
					 * node represents a leaf with a string, because the struct and therefore the
 | 
				
			||||||
 | 
					 * address is created if it doesn't exist yet.
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					TernaryTrieNode **ttnode_search(TernaryTrieNode *node, const char c,
 | 
				
			||||||
 | 
					                                bool create) {
 | 
				
			||||||
 | 
					  // Full leafs will always return NULL
 | 
				
			||||||
 | 
					  if (node->type == 2) {
 | 
				
			||||||
 | 
					    return NULL;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // It can happen that the node has no initialized root yet
 | 
				
			||||||
 | 
					  if (node->size == 0) {
 | 
				
			||||||
 | 
					    if (create) {
 | 
				
			||||||
 | 
					      node->size++;
 | 
				
			||||||
 | 
					      node->ptr.root = ttinode_init(c);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      return &node->ptr.root->next;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    return NULL;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  TernaryTrieInnerNode *parent = node->ptr.root;
 | 
				
			||||||
 | 
					  TernaryTrieInnerNode *child;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // Iterate through the tree until we either find the character or realize it's
 | 
				
			||||||
 | 
					  // not present in the tree
 | 
				
			||||||
 | 
					  // FIXME don't use while (1)
 | 
				
			||||||
 | 
					  while (1) {
 | 
				
			||||||
 | 
					    if (parent->key == c) {
 | 
				
			||||||
 | 
					      return &parent->next;
 | 
				
			||||||
 | 
					    } else if (c < parent->key) {
 | 
				
			||||||
 | 
					      child = parent->left;
 | 
				
			||||||
 | 
					    } else {
 | 
				
			||||||
 | 
					      child = parent->right;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    if (child == NULL) {
 | 
				
			||||||
 | 
					      break;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    parent = child;
 | 
				
			||||||
 | 
					  };
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // child is NULL, meaning the character isn't in the binary tree yet.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // If create is true, we create the new node so that we can still return a
 | 
				
			||||||
 | 
					  // non-NULL pointer.
 | 
				
			||||||
 | 
					  if (create) {
 | 
				
			||||||
 | 
					    TernaryTrieInnerNode *new_node = ttinode_init(c);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    if (c < parent->key) {
 | 
				
			||||||
 | 
					      parent->left = new_node;
 | 
				
			||||||
 | 
					    } else {
 | 
				
			||||||
 | 
					      parent->right = new_node;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    node->size++;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    return &new_node->next;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  return NULL;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Split a remaining string leaf node in two. This function assumes it receives
 | 
				
			||||||
 | 
					 * a full leaf as its input.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node to split
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					void ttnode_split(TernaryTrieNode *node) {
 | 
				
			||||||
 | 
					  TernaryTrieNode *new_node = ttnode_init();
 | 
				
			||||||
 | 
					  char key = node->ptr.string[0];
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // There's a chance the remaining string was only 1 character, meaning the new
 | 
				
			||||||
 | 
					  // node doesn't have to store a string
 | 
				
			||||||
 | 
					  if (node->ptr.string[1] != DELIMITER) {
 | 
				
			||||||
 | 
					    ttnode_set_string(new_node, node->ptr.string + 1);
 | 
				
			||||||
 | 
					  } else {
 | 
				
			||||||
 | 
					    new_node->type = 1;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  node->type = 0;
 | 
				
			||||||
 | 
					  node->size = 0;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  free(node->ptr.string);
 | 
				
			||||||
 | 
					  node->ptr.string = NULL;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // Initialize node's binary tree with the correct character
 | 
				
			||||||
 | 
					  TernaryTrieNode **node_ptr = ttnode_search(node, key, true);
 | 
				
			||||||
 | 
					  *node_ptr = new_node;
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/*
 | 
				
			||||||
 | 
					 * Remove the given character from a TernaryTrieInnerNode's subtree. The
 | 
				
			||||||
 | 
					 * function assumes the character is indeed in the subtree.
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					void ttinode_remove(TernaryTrieInnerNode *node, const char c) {
 | 
				
			||||||
 | 
					  TernaryTrieInnerNode **to_remove_ptr = &node;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // We use pointers to pointers here so we can later free the removed node
 | 
				
			||||||
 | 
					  // without having to know what its parent is
 | 
				
			||||||
 | 
					  while ((*to_remove_ptr)->key != c) {
 | 
				
			||||||
 | 
					    to_remove_ptr = (c < (*to_remove_ptr)->key) ? &(*to_remove_ptr)->left
 | 
				
			||||||
 | 
					                                                : &(*to_remove_ptr)->right;
 | 
				
			||||||
 | 
					  };
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  // If the node isn't a leaf, we have to replace it with another
 | 
				
			||||||
 | 
					  if ((*to_remove_ptr)->left != NULL || (*to_remove_ptr)->right != NULL) {
 | 
				
			||||||
 | 
					    TernaryTrieInnerNode *to_replace = *to_remove_ptr;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    // Replace with its only right child
 | 
				
			||||||
 | 
					    if (to_replace->left == NULL) {
 | 
				
			||||||
 | 
					      TernaryTrieInnerNode *to_remove = to_replace->right;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      to_replace->key = to_remove->key;
 | 
				
			||||||
 | 
					      to_replace->next = to_remove->next;
 | 
				
			||||||
 | 
					      to_replace->left = to_remove->left;
 | 
				
			||||||
 | 
					      to_replace->right = to_remove->right;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      free(to_remove);
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    // Replace with its only left child
 | 
				
			||||||
 | 
					    else if (to_replace->right == NULL) {
 | 
				
			||||||
 | 
					      TernaryTrieInnerNode *to_remove = to_replace->left;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      to_replace->key = to_remove->key;
 | 
				
			||||||
 | 
					      to_replace->next = to_remove->next;
 | 
				
			||||||
 | 
					      to_replace->left = to_remove->left;
 | 
				
			||||||
 | 
					      to_replace->right = to_remove->right;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      free(to_remove);
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    // Node has two children, so replace with successor
 | 
				
			||||||
 | 
					    else {
 | 
				
			||||||
 | 
					      TernaryTrieInnerNode *to_remove_parent = to_replace;
 | 
				
			||||||
 | 
					      TernaryTrieInnerNode *to_remove = to_replace->right;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      while (to_remove->left != NULL) {
 | 
				
			||||||
 | 
					        to_remove_parent = to_remove;
 | 
				
			||||||
 | 
					        to_remove = to_remove->left;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      to_replace->key = to_remove->key;
 | 
				
			||||||
 | 
					      to_replace->next = to_remove->next;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      if (to_remove_parent != to_replace) {
 | 
				
			||||||
 | 
					        to_remove_parent->left = to_remove->right;
 | 
				
			||||||
 | 
					      } else {
 | 
				
			||||||
 | 
					        to_remove_parent->right = to_remove->right;
 | 
				
			||||||
 | 
					      }
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      free(to_remove);
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					  // We're the leaf, so we free ourselves
 | 
				
			||||||
 | 
					  else {
 | 
				
			||||||
 | 
					    free(*to_remove_ptr);
 | 
				
			||||||
 | 
					    *to_remove_ptr = NULL;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					/**
 | 
				
			||||||
 | 
					 * Remove the given character from a TernaryTrieNode, respecting the rules
 | 
				
			||||||
 | 
					 * of a binary search tree. This function assumes the character is in the search
 | 
				
			||||||
 | 
					 * tree.
 | 
				
			||||||
 | 
					 *
 | 
				
			||||||
 | 
					 * @param node node to remove character from
 | 
				
			||||||
 | 
					 * @param c character to remove
 | 
				
			||||||
 | 
					 */
 | 
				
			||||||
 | 
					inline void ttnode_remove(TernaryTrieNode *node, const char c) {
 | 
				
			||||||
 | 
					  ttinode_remove(node->ptr.root, c);
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  node->size--;
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if (node->size == 0) {
 | 
				
			||||||
 | 
					    node->ptr.root = NULL;
 | 
				
			||||||
 | 
					  }
 | 
				
			||||||
 | 
					}
 | 
				
			||||||
		Loading…
	
		Reference in New Issue