Lecture 35 - Dec 1, 2023
Last lecture
Delete a node in BST.
Today
Hash tables
Data structures and run time of operations
| Unsorted List | Sorted List | BST |
Insert | O(1) | O(n) | O(log n) |
Search | O(n) | O(log n) | O(log n) |
Hash tables
Hash tables provides average performance on search/insert/deletion.
- Very large array
- Each key maps to a unique index
- Hash function
maps key to array index
Example:
Use cases:
- Databases
- Caching
In both cases quick data retrieval is critical.
Example:
insert(16): h(16) = 2
insert(25): h(25) = 4
insert(77): h(77) = 0
insert(7): h(7) = 2
0 | 77
1 |
2 | 16
3 |
4 | 25
5 |
6 |
Problem
Collision happens when two keys map to the same index.
Solution 1: Hashing with chaining
Each hash table entry contrains a pointer to a linked list of keys that map to the same entry.
But we may have collisions always and one array entry has a linked list of all keys. This leads to an
Usually, good hash functions can reduce the number of collisions. Ideally, we want the length of each linked list to be one maximum.
Usually, good hash function involve multiplying key with large prime number (e.g.,
0 | 77 -> 7
1
2 | 16
3
4 | 25
5
6
class Node {
// for simplicity, all data members are public
public:
int key;
*next;
Node ~Node() { delete next; }
};
class List {
public:
(); // sets head to NULL
Listbool isEmpty(); // returns true if head is NULL
void insert(int v); // inserts at head
* remove(int k); // removes first node with key = k
ListNodebool isFound(int k); // returns true if key k is found
~List();
};
#define SIZE 7
class HashTable {
private:
** table;
Listpublic:
() {
HashTable= new List*[SIZE];
table for (int i = 0; i < SIZE; i++) {
[i] = NULL;
table}
}
bool search(int v) {
int idx = v % SIZE;
if (table[idx] != NULL) {
// table[idx] is of class List*
return table[idx]->isFound(v);
} else {
return false; // the list where v should be is not there
}
}
void insert(int v) {
if (search(v)) { // value already there
return;
} else {
int idx = v % SIZE;
if (table[idx] == NULL) {
[idx] = new List();
table}
// table[idx] is of class List*
[idx]->insert(v);
table}
}
~HashTable() {
for (int i = 0; i < SIZE; i++) {
delete table[i];
}
delete[] table;
}
void remove(int v);
};
Homework: Implement remove for HashTable.
Solution 2: Closed hashing with linear probing
If hash function lead to collision, insert value at the next available space in the table.
Linear probing is used tp find the next available space in the table.
Additional code from the class
List.h
:
#ifndef LIST_H_
#define LIST_H_
#include <iostream>
using namespace std;
class Node {
public:
int key;
* next;
Node~Node(){delete next;}
};
class List {
private:
* head;
Node
public:
(){head = NULL;}
List
bool isFound(int k) {
* p = head;
Nodewhile (p != NULL) {
// cout << "p->name is " << p->name << " and name is " << name << endl;
if (p->key == k) {
return true;
}
= p->next;
p }
return false;
}
* remove(int v) {
Node* p = head;
Node* prev = NULL;
Nodewhile (p != NULL) {
if (p->key == v) {
if (prev != NULL) {
->next = p->next;
prev->next = NULL;
p} else {
= p->next;
head ->next = NULL;
p}
return p;
}
= p;
prev = p->next;
p }
return NULL;
}
void insert(int v) {
* node = new Node;
Node->key = v;
node->next = NULL;
node->next = head;
node= node;
head }
void print(){
* current = head;
Nodewhile(current != NULL){
<< current->key << " ";
cout = current->next;
current }
<< endl;
cout }
~List() { delete head; }
};
#endif
HashTable.h
:
#ifndef HASH_H_
#define HASH_H_
#define SIZE 7
#include "List.h"
class HashTable {
private:
** table;
List
public:
() {
HashTable= new List*[SIZE];
table for (int i = 0; i < SIZE; i++) {
[i] = NULL;
table}
}
bool search(int v) {
int idx = v % SIZE;
if (table[idx] != NULL) {
return table[idx]->isFound(v);
} else {
return false;
}
}
void insert(int v) {
if (search(v)) {
return;
} else {
int idx = v % SIZE;
if (table[idx] == NULL) {
[idx] = new List;
table}
[idx]->insert(v);
table}
}
void display() {
for (int i = 0; i < SIZE; i++) {
if (table[i] != NULL) {
[i]->print();
table}
}
}
void remove(int v) {
if (!search(v)) {
return;
} else {
int idx = v % SIZE;
if (table[idx] == NULL) {
return;
} else {
delete table[idx]->remove(v);
}
}
}
~HashTable() {
for (int i = 0; i < SIZE; i++) {
delete table[i];
}
delete[] table;
}
};
#endif
main.cpp
:
#include <iostream>
#include "HashTable.h"
using namespace std;
int main(){
;
HashTable H.insert(4);
H.insert(7);
H.insert(77);
H
.remove(77);
H.display();
Hreturn 0;
}