Sort numbers stored on different machines

Hello Everyone,

Given N machines. Each machine contains some numbers in sorted form. But the amount of numbers, each machine has is not fixed. Output the numbers from all the machine in sorted non-decreasing form.
Example:

Machine M1 contains 3 numbers: {30, 40, 50} Machine M2 contains 2 numbers: {35, 45} Machine M3 contains 5 numbers: {10, 60, 70, 80, 100} Output: {10, 30, 35, 40, 45, 50, 60, 70, 80, 100}

Representation of stream of numbers on each machine is considered as linked list. A Min Heap can be used to print all numbers in sorted order.

Following is the detailed process

1. Store the head pointers of the linked lists in a minHeap of size N where N is number of machines.

2. Extract the minimum item from the minHeap. Update the minHeap by replacing the head of the minHeap with the next number from the linked list or by replacing the head of the minHeap with the last number in the minHeap followed by decreasing the size of heap by 1.

3. Repeat the above step 2 until heap is not empty.

Below is C++ implementation of the above approach.

// A program to take numbers from different machines and print them in sorted order

#include <stdio.h>

// A Linked List node

struct ListNode

{

int data;

struct ListNode* next;

};

// A Min Heap Node

struct MinHeapNode

{

ListNode* head;

};

// A Min Heao (Collection of Min Heap nodes)

struct MinHeap

{

int count;

int capacity;

MinHeapNode* array;

};

// A function to create a Min Heap of given capacity

MinHeap* createMinHeap( int capacity )

{

MinHeap* minHeap = new MinHeap;

minHeap->capacity = capacity;

minHeap->count = 0;

minHeap->array = new MinHeapNode [minHeap->capacity];

return minHeap;

}

/* A utility function to insert a new node at the beginning

of linked list */

void push (ListNode** head_ref, int new_data)

{

/* allocate node */

ListNode* new_node = new ListNode;

/* put in the data */

new_node->data = new_data;

/* link the old list off the new node */

new_node->next = (*head_ref);

/* move the head to point to the new node */

(*head_ref) = new_node;

}

// A utility function to swap two min heap nodes. This function

// is needed in minHeapify

void swap( MinHeapNode* a, MinHeapNode* b )

{

MinHeapNode temp = *a;

*a = *b;

*b = temp;

}

// The standard minHeapify function.

void minHeapify( MinHeap* minHeap, int idx )

{

int left, right, smallest;

left = 2 * idx + 1;

right = 2 * idx + 2;

smallest = idx;

if ( left < minHeap->count &&

minHeap->array[left].head->data <

minHeap->array[smallest].head->data

)

smallest = left;

if ( right < minHeap->count &&

minHeap->array[right].head->data <

minHeap->array[smallest].head->data

)

smallest = right;

if ( smallest != idx )

{

swap( &minHeap->array[smallest], &minHeap->array[idx] );

minHeapify( minHeap, smallest );

}

}

// A utility function to check whether a Min Heap is empty or not

int isEmpty( MinHeap* minHeap )

{

return (minHeap->count == 0);

}

// A standard function to build a heap

void buildMinHeap( MinHeap* minHeap )

{

int i, n;

n = minHeap->count - 1;

for ( i = (n - 1) / 2; i >= 0; --i )

minHeapify( minHeap, i );

}

// This function inserts array elements to heap and then calls

// buildHeap for heap property among nodes

void populateMinHeap( MinHeap* minHeap, ListNode* *array, int n )

{

for ( int i = 0; i < n; ++i )

minHeap->array[ minHeap->count++ ].head = array[i];

buildMinHeap( minHeap );

}

// Return minimum element from all linked lists

ListNode* extractMin( MinHeap* minHeap )

{

if ( isEmpty( minHeap ) )

return NULL;

// The root of heap will have minimum value

MinHeapNode temp = minHeap->array[0];

// Replace root either with next node of the same list.

if ( temp.head->next )

minHeap->array[0].head = temp.head->next;

else // If list empty, then reduce heap size

{

minHeap->array[0] = minHeap->array[ minHeap->count - 1 ];

--minHeap->count;

}

minHeapify( minHeap, 0 );

return temp.head;

}

// The main function that takes an array of lists from N machines

// and generates the sorted output

void externalSort( ListNode *array[], int N )

{

// Create a min heap of size equal to number of machines

MinHeap* minHeap = createMinHeap( N );

// populate first item from all machines

populateMinHeap( minHeap, array, N );

while ( !isEmpty( minHeap ) )

{

ListNode* temp = extractMin( minHeap );

printf ( "%d " ,temp->data );

}

}

// Driver program to test above functions

int main()

{

int N = 3; // Number of machines

// an array of pointers storing the head nodes of the linked lists

ListNode *array[N];

// Create a Linked List 30->40->50 for first machine

array[0] = NULL;

push (&array[0], 50);

push (&array[0], 40);

push (&array[0], 30);

// Create a Linked List 35->45 for second machine

array[1] = NULL;

push (&array[1], 45);

push (&array[1], 35);

// Create Linked List 10->60->70->80 for third machine

array[2] = NULL;

push (&array[2], 100);

push (&array[2], 80);

push (&array[2], 70);

push (&array[2], 60);

push (&array[2], 10);

// Sort all elements

externalSort( array, N );

return 0;

}

Output:

10 30 35 40 45 50 60 70 80 100