Quark
Quark

Reputation: 399

Frequency of Node/value in a binary search tree

Given a binary search tree where there may contain duplicates, but all other logic of the BST is intact,determine the most frequently occurring element.

class TreeNode
{
public:
    TreeNode* right = NULL;
    TreeNode* left = NULL;
    int val;

    TreeNode(int value)
    {
        val = value;
    }
};

// To keep track of the frequency of the value/node
struct holder
{
public:
    TreeNode* most = NULL;
    int count = 0;
};

int frequencyOfNode(TreeNode* root, struct holder* ptr)
{
    if (root == NULL)
    {
        return 0;
    }

    int left = frequencyOfNode(root->left, ptr);
    int right = frequencyOfNode(root->right, ptr);

// need to check of left and right are nor null
    if (left != 0 && root->val == root->left->val)
    {
        return 1 + left;
    }
    else if (right != 0 && root->val == root->right->val)
    {
        return 1 + right;
    }
    else
    {
        // left has a higher frequency
        if (left >= right)
        {
            // left is bigger;
            if (left > ptr->count)
            {
                ptr->most = root->left;
                ptr->count = left;
            }
        }
        else
        {
            // right has a higher frequency
            if (right > ptr->count)
            {
                ptr->most = root->right;
                ptr->count = right;
            }
        }

        return 1;
    }
}

I am doing a post order traversal of the binary search tree. my logic works when the nodes appears in consecutive order, but if the node is not in consecutive order; the frequency of the node is reset.

my time is O(n) and space is O(1).

the issue is when the Nodes do not linked in succession.

my sample Tree:

int main()
{
    TreeNode *root = new TreeNode(6);
    root->right = new TreeNode(8);
    root->right->left = new TreeNode(7);
    root->right->right = new TreeNode(8);
    root->right->right->right = new TreeNode(8);
    root->right->right->right->right = new TreeNode(9);
    root->right->right->right->right->left = new TreeNode(8);
    root->left = new TreeNode(4);
    root->left->right = new TreeNode(5);
    root->left->right->right = new TreeNode(5);
    root->left->right->right->right = new TreeNode(5);
    root->left->left = new TreeNode(1);
    root->left->left->right = new TreeNode(1);
    root->left->left->right->right = new TreeNode(1);
    root->left->left->right->right = new TreeNode(2);
    root->left->left->left = new TreeNode(0);

    struct holder freq;
    int ran = frequencyOfNode(root, &freq);
    std::cout << "random" << ran << std::endl;

    std::cout << "The Node: " << freq.most->val << " frequency " << freq.count
            << std::endl;

    return 0;
}

I'm really confused on how to take into account, when the nodes are not consecutive( i.e 8->8->8->9->8).

Upvotes: 0

Views: 2334

Answers (1)

Andros Rex
Andros Rex

Reputation: 372

I see you have fixed some problems yourself. Anyway, I decided to solve this completely, changing a few things as well to simplify everything. It uses O(N) time and O(1) space:

#include <iostream>
#include <limits>

class TreeNode
{
public:
    TreeNode* right;
    TreeNode* left;
    int val;

    TreeNode(int value)
    {
        val = value;
        right = left = NULL;
    }
};

// To keep track of the frequency of the value/node
struct Holder
{
public:
    int value;
    int count;

    Holder(int v=std::numeric_limits<int>::min(), int c=-1): value(v), count(c) {}
};



void dfs(TreeNode* root, int &mostFrequent, int &mostFrequentCount, int &current, int &currentCount)
{
    if(root->left) dfs(root->left, mostFrequent, mostFrequentCount, current, currentCount); //first go to smaller

    int val = root->val;

    if(val == current) currentCount++;
    else { current=val; currentCount=1; }

    if(currentCount > mostFrequentCount) 
    {
        mostFrequent=current;
        mostFrequentCount=currentCount;
    }

    if(root->right) dfs(root->right, mostFrequent, mostFrequentCount, current, currentCount); //finally go to larger
}

Holder getMostFrequent(TreeNode *root)
{
    int mostFrequent=-1,mostFrequentCount=-1, current=std::numeric_limits<int>::min(), currentCount=-1;
    if(root) dfs(root, mostFrequent, mostFrequentCount, current, currentCount);

    return Holder(mostFrequent, mostFrequentCount);
}


int main()
{
    TreeNode *root = new TreeNode(6);
    root->right = new TreeNode(8);
    root->right->left = new TreeNode(7);
    root->right->right = new TreeNode(8);
    root->right->right->right = new TreeNode(8);
    root->right->right->right->right = new TreeNode(9);
    root->right->right->right->right->left = new TreeNode(8);
    root->left = new TreeNode(4);
    root->left->right = new TreeNode(5);
    root->left->right->right = new TreeNode(5);
    root->left->right->right->right = new TreeNode(5);
    root->left->left = new TreeNode(1);
    root->left->left->right = new TreeNode(1);
    root->left->left->right->right = new TreeNode(1);
    root->left->left->right->right = new TreeNode(2);
    root->left->left->left = new TreeNode(0);

    Holder h = getMostFrequent(root);

    std::cout << "most frequently encountered element: " << h.value << ", " << h.count << " times\n";


    return 0;
}

It uses the fact that since this is a BST, traversing it in the [left -> current -> right] order would result in sorted elements, that's all.

Upvotes: 2

Related Questions