pavlosdais
diff --git a/‎HashTable/Linear Hashing/README.md
Copy file name to clipboard
+14Lines changed: 14 additions & 0 deletions b/‎HashTable/Linear Hashing/README.md
Copy file name to clipboard
+14Lines changed: 14 additions & 0 deletions
diff --git a/‎HashTable/Linear Hashing/hash_table.c
Copy file name to clipboard
+290Lines changed: 290 additions & 0 deletions b/‎HashTable/Linear Hashing/hash_table.c
Copy file name to clipboard
+290Lines changed: 290 additions & 0 deletions
diff --git a/‎HashTable/Linear Hashing/hash_table.h
Copy file name to clipboard
+44Lines changed: 44 additions & 0 deletions b/‎HashTable/Linear Hashing/hash_table.h
Copy file name to clipboard
+44Lines changed: 44 additions & 0 deletions
diff --git a/‎HashTable/README.md
Copy file name to clipboard
+1-11Lines changed: 1 addition & 11 deletions b/‎HashTable/README.md
Copy file name to clipboard
+1-11Lines changed: 1 addition & 11 deletions
diff --git a/‎HashTable/Seperate chaining/README.md
Copy file name to clipboard
+11Lines changed: 11 additions & 0 deletions b/‎HashTable/Seperate chaining/README.md
Copy file name to clipboard
+11Lines changed: 11 additions & 0 deletions
@@ -0,0 +1,14 @@
+This is an implementation using linear hashing. Linear hashing is a dynamic data structure which implements a hash table and grows or shrinks one bucket at a time. A linear hashing file expands by splitting a pre-determined bucket into two. The trigger for the split in this implementation is an overflow of elements in a bucket (by default, more than 4). In order to access a record with key c, a family of hash functions, collectively called a dynamic hash function, is applied to the key c. At any time, at most two hash functions h(i) and h(i+1) are used.
+
+# Performance
+If n is the number of elements in the hash table:
+
+Algorithm  | Average case | Worst case
+---------- | -------      | ----------
+Space	   | O(n)	      | O(n)
+Insert	   | O(1)	      | O(n)
+Remove	   | O(1)	      | O(n)
+Search	   | O(1)	      | O(n)
+
+# Learn more
+For more information as well as examples click [here](https://www.alexdelis.eu/M149/e_ds_linearhashing.pdf).
@@ -0,0 +1,290 @@
+#include <stdio.h>
+#include <stdlib.h>
+#include <assert.h>
+#include "hash_table.h"
+
+// Counter type used for the per-bucket element counts.
+// NOTE: being an unsigned char, a counter wraps around once a single bucket
+// holds more than UCHAR_MAX elements (nothing in this file guards against that).
+typedef unsigned char small_int;
+
+// A single entry of a bucket. Every bucket is a singly linked list of these entries.
+typedef struct n
+{
+    Pointer data;     // pointer to the stored element (freed through the table's destroy function, if one is set)
+    uint hash_value;  // hash of the element, cached at insertion so that splits do not have to rehash
+    struct n* next;   // next entry of the same bucket (NULL if this is the last one)
+}
+n;
+// Handle to an entry; the bucket array stores one of these per bucket (the head of the list).
+typedef struct n* node;
+
+// State of a linear hashing table.
+// hash_init() and hash_insert() keep curr_size == 2^exponent + next_split.
+typedef struct hash_table
+{
+    uint curr_size;                   // number of buckets currently in use
+    uint max_capacity;                // number of bucket slots currently allocated
+    uint elements;                    // number of elements in the hash table
+    uint exponent;                    // current exponent i: find_func(i) and find_func(i+1) are the two moduli used by get_bucket
+    uint next_split;                  // index of the next bucket to be split; buckets below it have already been split in this round
+    small_int* curr_num_of_elements;  // number of elements in each bucket (parallel to buckets)
+    node* buckets;                    // array of bucket heads (linked lists) storing the data
+    HashFunc hash;                    // function that hashes an element into a positive integer
+    CompareFunc compare;              // function that compares two elements, returning 0 when they are equal
+    DestroyFunc destroy;              // function that destroys an element, NULL if elements should not be destroyed
+}
+hash_table;
+
+
+// Tuning constants of the table.
+#define STARTING_HASH_CAPACITY 50  // number of bucket slots allocated by hash_init
+#define MAX_BUCKET_ELEMENTS 4      // an insertion that leaves a bucket with more elements than this triggers a split
+#define INCREASE_SIZE 1.8          // factor by which hash_resize multiplies the number of allocated bucket slots
+
+
+// Function Prototypes (helpers private to this file)
+
+// grows the bucket and counter arrays by INCREASE_SIZE
+static void hash_resize(HashTable ht);
+// maps a hash value to the index of the bucket it currently belongs to
+static uint get_bucket(HashTable ht, uint hash_value);
+// returns 2^i
+static uint find_func(uint i);
+// returns -1 (converted to uint) if value exists, otherwise the bucket it should be inserted in
+static uint hash_search(HashTable ht, Pointer value);
+
+// Allocates an empty hash table and stores it in *ht.
+//
+// ht:      where the new table is stored
+// hash:    maps an element to an unsigned integer (must not be NULL)
+// compare: returns 0 when two elements are equal (must not be NULL)
+// destroy: called on an element when it is removed or when the table is destroyed;
+//          may be NULL, in which case elements are never destroyed by the table
+//
+// The table starts with a single bucket in use and STARTING_HASH_CAPACITY slots allocated.
+// Allocation failures are caught by assert, like everywhere else in this file.
+void hash_init(HashTable* ht, HashFunc hash, CompareFunc compare, DestroyFunc destroy)
+{
+    assert(ht != NULL);
+    assert(hash != NULL && compare != NULL);  // a hash and compare function needs to be given
+
+    hash_table* table = malloc(sizeof(*table));
+    assert(table != NULL);  // allocation failure
+
+    // each slot only holds the head pointer of a chain, so the array is sized by the
+    // pointer type (the same element size hash_resize uses) and not by the node struct;
+    // calloc zeroes the slots, leaving every chain empty
+    table->buckets = calloc(STARTING_HASH_CAPACITY, sizeof(*(table->buckets)));
+    assert(table->buckets != NULL);  // allocation failure
+
+    // per-bucket element counters, all starting at 0
+    table->curr_num_of_elements = calloc(STARTING_HASH_CAPACITY, sizeof(*(table->curr_num_of_elements)));
+    assert(table->curr_num_of_elements != NULL);  // allocation failure
+
+    table->max_capacity = STARTING_HASH_CAPACITY;
+    table->elements = 0;
+
+    // round 0: one bucket in use (2^0), nothing split yet
+    table->exponent = 0;
+    table->curr_size = 1;
+    table->next_split = 0;
+
+    // initialize functions
+    table->hash = hash;
+    table->compare = compare;
+    table->destroy = destroy;
+
+    *ht = table;
+}
+
+// Splits the bucket at ht->next_split into itself and a newly claimed bucket at the
+// end of the table, then advances the split pointer (starting a new round when every
+// bucket of the current round has been split).
+static void split_next_bucket(HashTable ht)
+{
+    // claim one more bucket, growing the arrays when the allocated slots run out
+    ht->curr_size++;
+    if (ht->curr_size == ht->max_capacity)
+        hash_resize(ht);
+
+    const uint old_index = ht->next_split;
+    const uint new_index = ht->curr_size - 1;
+
+    // advance the split pointer before redistributing, so that get_bucket() applies
+    // the next-level hash function to the entries of the bucket being split
+    ht->next_split++;
+
+    node* src = &(ht->buckets[old_index]);       // link leading to the entry under inspection
+    node* dst_tail = &(ht->buckets[new_index]);  // link where the next moved entry is appended
+
+    while (*src != NULL)
+    {
+        node curr = *src;
+        if (get_bucket(ht, curr->hash_value) != old_index)
+        {
+            // unlink from the old bucket and append to the new one (keeps relative order)
+            *src = curr->next;
+            curr->next = NULL;
+            *dst_tail = curr;
+            dst_tail = &(curr->next);
+
+            ht->curr_num_of_elements[old_index]--;
+            ht->curr_num_of_elements[new_index]++;
+        }
+        else
+            src = &(curr->next);
+    }
+
+    // every bucket of this round has been split: start the next round of splitting
+    if (find_func(ht->exponent + 1) <= ht->curr_size)
+    {
+        ht->exponent++;
+        ht->next_split = 0;
+    }
+}
+
+// Inserts value into the hash table.
+// Returns true if the value was inserted, false if an equal value (according to the
+// table's compare function) already exists, in which case the table is left untouched.
+// An insertion that leaves its bucket with more than MAX_BUCKET_ELEMENTS elements
+// triggers a split of the bucket at next_split (not necessarily the overflowing one).
+bool hash_insert(HashTable ht, Pointer value)
+{
+    // hash only once: the same hash value locates the bucket and is cached in the node
+    const uint hash_value = ht->hash(value);
+    const uint bucket = get_bucket(ht, hash_value);
+
+    // check to see if value already exists
+    for (node curr = ht->buckets[bucket]; curr != NULL; curr = curr->next)
+    {
+        if (ht->compare(value, curr->data) == 0)
+            return false;
+    }
+
+    // create new node
+    node new_node = malloc(sizeof(*new_node));
+    assert(new_node != NULL);  // allocation failure
+
+    new_node->data = value;
+    new_node->hash_value = hash_value;
+
+    // insert the value at the start of the bucket
+    new_node->next = ht->buckets[bucket];
+    ht->buckets[bucket] = new_node;
+    ht->curr_num_of_elements[bucket]++;
+
+    // split if an overflow occurs
+    if (ht->curr_num_of_elements[bucket] > MAX_BUCKET_ELEMENTS)
+        split_next_bucket(ht);
+
+    ht->elements++;  // value inserted, increment the number of elements in the hash table
+    return true;
+}
+
+// Removes the element equal to value (according to the table's compare function).
+// The stored element is passed to the destroy function when one is set.
+// Returns true if an element was removed, false if no equal element was found.
+bool hash_remove(HashTable ht, Pointer value)
+{
+    // only the bucket the value hashes to can contain it
+    const uint index = get_bucket(ht, ht->hash(value));
+
+    // 'link' always refers to the pointer that leads to the entry under inspection,
+    // so unlinking works the same way for the head and for inner entries
+    for (node* link = &(ht->buckets[index]); *link != NULL; link = &((*link)->next))
+    {
+        node candidate = *link;
+        if (ht->compare(value, candidate->data) != 0)
+            continue;  // not this one, look at the next entry
+
+        // value found: take the entry out of the chain
+        *link = candidate->next;
+
+        // if a destroy function exists, destroy the stored element
+        if (ht->destroy != NULL)
+            ht->destroy(candidate->data);
+
+        free(candidate);
+
+        ht->curr_num_of_elements[index]--;
+        ht->elements--;
+        return true;
+    }
+
+    return false;
+}
+
+// Returns true if an element equal to value is stored in the hash table, false otherwise.
+bool hash_exists(HashTable ht, Pointer value)
+{
+    // hash_search reports a hit with -1 converted to uint, and a miss with a bucket index
+    const uint found_marker = (uint)-1;
+
+    return hash_search(ht, value) == found_marker;
+}
+
+// Looks value up in the bucket it hashes to.
+// Returns -1 (converted to uint) if an equal element exists;
+// otherwise returns the index of the bucket the value belongs to.
+static uint hash_search(HashTable ht, Pointer value)
+{
+    // the only bucket that can hold the value
+    const uint index = get_bucket(ht, ht->hash(value));
+
+    // walk the chain until an equal element shows up
+    for (node curr = ht->buckets[index]; curr != NULL; curr = curr->next)
+    {
+        if (ht->compare(value, curr->data) == 0)
+            return (uint)-1;  // value found
+    }
+
+    return index;
+}
+
+// Maps a hash value to the index of the bucket it currently belongs to.
+// Buckets below next_split have already been split in this round, so hash values
+// landing there are redistributed with the next-level function (modulo 2^(exponent+1)).
+static uint get_bucket(HashTable ht, uint hash_value)
+{
+    // hash function i
+    const uint current_level = hash_value % find_func(ht->exponent);
+
+    if (current_level >= ht->next_split)
+        return current_level;
+
+    // hash function i+1
+    return hash_value % find_func(ht->exponent + 1);
+}
+
+// Grows the number of allocated bucket slots by a factor of INCREASE_SIZE.
+// Existing buckets and counters are kept; the newly added slots start out empty.
+static void hash_resize(HashTable ht)
+{
+    const uint previous = ht->max_capacity;
+    const uint grown = (uint)(previous * INCREASE_SIZE);  // truncated towards zero
+
+    ht->max_capacity = grown;
+
+    ht->buckets = realloc(ht->buckets, sizeof(*(ht->buckets)) * grown);
+    assert(ht->buckets != NULL);  // allocation failure
+
+    ht->curr_num_of_elements = realloc(ht->curr_num_of_elements, sizeof(small_int) * grown);
+    assert(ht->curr_num_of_elements != NULL);  // allocation failure
+
+    // realloc leaves the added memory uninitialized: mark the new slots as empty buckets
+    uint slot = previous;
+    while (slot < grown)
+    {
+        ht->buckets[slot] = NULL;
+        ht->curr_num_of_elements[slot] = 0;
+        slot++;
+    }
+}
+
+// Prints every bucket in use on its own line: the bucket index, its elements
+// (each printed by calling visit on it, in chain order) and finally the number
+// of elements the bucket holds, between '|'.
+void print_table(HashTable ht, VisitFunc visit)
+{
+    for (uint i = 0; i < ht->curr_size; i++)
+    {
+        // the index is unsigned, so it is printed with %u
+        printf("(%u): ", i);
+
+        for (node curr = ht->buckets[i]; curr != NULL; curr = curr->next)
+            visit(curr->data);
+
+        // print the number of elements in the bucket
+        // (the unsigned char counter is promoted to int, which is what %d expects)
+        printf("|%d|", ht->curr_num_of_elements[i]);
+        printf("\n");
+    }
+}
+
+// Returns the number of elements currently stored in the hash table.
+uint hash_size(HashTable ht)
+{
+    const uint stored = ht->elements;
+    return stored;
+}
+
+// returns 2^i
+// The shift is done on an unsigned operand: shifting the signed constant 1 into the
+// sign bit is undefined behaviour. i must be smaller than the bit width of uint.
+static uint find_func(uint i)
+{
+    return (uint)1 << i;
+}
+
+// Replaces the table's destroy function with new_destroy_func (which may be NULL
+// to stop the table from destroying elements) and returns the previous one.
+DestroyFunc hash_set_destroy(HashTable ht, DestroyFunc new_destroy_func)
+{
+    DestroyFunc previous = ht->destroy;
+
+    ht->destroy = new_destroy_func;
+
+    return previous;
+}
+
+// Frees the hash table: every entry, the bucket and counter arrays and the table itself.
+// The stored elements are destroyed as well when a destroy function is set.
+void hash_destroy(HashTable ht)
+{
+    // release the chain of every allocated slot (unused slots hold NULL)
+    for (uint slot = 0; slot < ht->max_capacity; slot++)
+    {
+        node curr = ht->buckets[slot];
+        while (curr != NULL)
+        {
+            // remember the successor before the entry is freed
+            node following = curr->next;
+
+            // if a destroy function is given, destroy the element
+            if (ht->destroy != NULL)
+                ht->destroy(curr->data);
+            free(curr);
+
+            curr = following;
+        }
+    }
+
+    free(ht->curr_num_of_elements);
+    free(ht->buckets);
+    free(ht);
+}
@@ -0,0 +1,44 @@
+// Public interface of the linear hashing hash table.
+#ifndef HASH_TABLE_H
+#define HASH_TABLE_H
+
+#include <stdbool.h>
+
+// Opaque handle to a hash table; created by hash_init and released by hash_destroy
+typedef struct hash_table* HashTable;
+
+// Generic element type stored in the hash table
+typedef void* Pointer;
+
+// Pointer to function that compares 2 elements a and b and returns 0 if a and b are equal
+typedef int (*CompareFunc)(Pointer a, Pointer b);
+
+// Pointer to function that destroys an element value
+typedef void (*DestroyFunc)(Pointer value);
+
+// Pointer to function that hashes a value to a positive integer
+// (spelled 'unsigned int' so that this header does not depend on a 'uint' typedef
+// being declared by whatever happens to be included before it)
+typedef unsigned int (*HashFunc)(Pointer value);
+
+// Pointer to function that visits an element
+typedef void (*VisitFunc)(Pointer value);
+
+
+// initializes hash table
+// hash and compare must not be NULL; destroy may be NULL if elements should not be destroyed
+void hash_init(HashTable* ht, HashFunc hash, CompareFunc compare, DestroyFunc destroy);
+
+// inserts value at the hash table
+// returns true if the value was inserted, false if it already exists
+bool hash_insert(HashTable ht, Pointer value);
+
+// removes the value from the hash table and destroys its value if a destroy function was given
+// returns true if the value was deleted, false if it does not exist and thus it was not deleted
+bool hash_remove(HashTable ht, Pointer value);
+
+// returns true if value exists in the hash table, false otherwise
+bool hash_exists(HashTable ht, Pointer value);
+
+// changes destroy function and returns the old one
+DestroyFunc hash_set_destroy(HashTable ht, DestroyFunc new_destroy_func);
+
+// returns the number of elements currently stored in the hash table
+unsigned int hash_size(HashTable ht);
+
+// prints hash table: one line per bucket, calling visit on every element
+void print_table(HashTable ht, VisitFunc visit);
+
+// destroys the hash table and its values, if a destroy function is given
+void hash_destroy(HashTable ht);
+
+#endif  // HASH_TABLE_H
@@ -1,11 +1 @@
-[Hash table](https://en.wikipedia.org/wiki/Hash_table) also known as hash map, is a data structure that implements a set abstract data type, a structure that can map keys to values. A hash table uses a hash function to compute an index, also called a hash code, into an array of buckets or slots, from which the desired value can be found.
-
-## Performance
-This is an implentation using separate chaining. In separate chaining, each slot of the hash table is a linked list. When two or more elements are hashed to the same location (when a collision occurs), these elements are represented into a singly-linked list much like a chain. If there are n elements and b is the number of the buckets there would be n/b entries on each bucket. This value n/b is called the load factor that represents the load that is there on our map. So, theoretically, when the load factor increases so does the complexity of the operations. In order for the load factor to be kept low and remain almost constant complexity, we increase the number of buckets (approximately doubling) and rehash once the load factor increases to more than a pre-defined value (the default value here is 1.2).
-
-Algorithm  | Average case | Worst case
----------- | -------      | ----------
-Space	   | O(n)	      | O(n)
-Insert	   | O(1)	      | O(n)
-Remove	   | O(1)	      | O(n)
-Search	   | O(1)	      | O(n)
+[Hash table](https://en.wikipedia.org/wiki/Hash_table) also known as hash map, is a data structure that implements a set abstract data type, a structure that can map keys to values. A hash table uses a hash function to compute an index, also called a hash code, into an array of buckets or slots, from which the desired value can be found.
@@ -0,0 +1,11 @@
+This is an implementation using separate chaining. In separate chaining, each slot of the hash table is a linked list. When two or more elements are hashed to the same location (when a collision occurs), these elements are stored in a singly-linked list, much like a chain. If there are n elements and b is the number of buckets, there would be n/b entries in each bucket on average. This value n/b is called the load factor and represents the load on our map. So, theoretically, when the load factor increases so does the complexity of the operations. In order to keep the load factor low and the complexity almost constant, we increase the number of buckets (approximately doubling it) and rehash once the load factor exceeds a pre-defined value (the default value here is 1.2).
+
+## Performance
+If n is the number of elements in the hash table:
+
+Algorithm  | Average case | Worst case
+---------- | -------      | ----------
+Space	   | O(n)	      | O(n)
+Insert	   | O(1)	      | O(n)
+Remove	   | O(1)	      | O(n)
+Search	   | O(1)	      | O(n)