Open In App

Count of subarrays having exactly K distinct elements

Improve
Improve
Like Article
Like
Save
Share
Report

Given an array arr[] of size N and an integer K. The task is to find the count of subarrays such that each subarray has exactly K distinct elements.

Examples:

Input: arr[] = {2, 1, 2, 1, 6}, K = 2 
Output:
{2, 1}, {1, 2}, {2, 1}, {1, 6}, {2, 1, 2}, 
{1, 2, 1} and {2, 1, 2, 1} are the only valid subarrays.

Input: arr[] = {1, 2, 3, 4, 5}, K = 1 
Output:

Approach: To directly count the subarrays with exactly K different integers is hard but to find the count of subarrays with at most K different integers is easy. So the idea is to find the count of subarrays with at most K different integers, let it be C(K), and the count of subarrays with at most (K – 1) different integers, let it be C(K – 1) and finally take their difference, C(K) – C(K – 1) which is the required answer. 
Count of subarrays with at most K different elements can be easily calculated through the sliding window technique. The idea is to keep expanding the right boundary of the window till the count of distinct elements in the window is less than or equal to K and when the count of distinct elements inside the window becomes more than K, start shrinking the window from the left till the count becomes less than or equal to K. Also for every expansion, keep counting the subarrays as right – left + 1 where right and left are the boundaries of the current window.

Below is the implementation of the above approach:

C++




// C++ implementation of the approach
#include<bits/stdc++.h>
#include<map>
using namespace std;
 
 
// Function to return the count of subarrays
// with at most K distinct elements using
// the sliding window technique
int atMostK(int arr[], int n, int k)
{
 
    // To store the result
    int count = 0;
 
    // Left boundary of window
    int left = 0;
 
    // Right boundary of window
    int right = 0;
 
    // Map to keep track of number of distinct
    // elements in the current window
    unordered_map<int,int> map;
    // Loop to calculate the count
    while (right < n) {
 
        // Calculating the frequency of each
        // element in the current window
        if (map.find(arr[right])==map.end())
            map[arr[right]]=0;
        map[arr[right]]++;
 
        // Shrinking the window from left if the
        // count of distinct elements exceeds K
        while (map.size() > k) {
            map[arr[left]]= map[arr[left]] - 1;
            if (map[arr[left]] == 0)
                map.erase(arr[left]);
            left++;
        }
 
        // Adding the count of subarrays with at most
        // K distinct elements in the current window
        count += right - left + 1;
        right++;
    }
    return count;
}
 
// Function to return the count of subarrays
// with exactly K distinct elements
int exactlyK(int arr[], int n, int k)
{
 
    // Count of subarrays with exactly k distinct
    // elements is equal to the difference of the
    // count of subarrays with at most K distinct
    // elements and the count of subararys with
    // at most (K - 1) distinct elements
    return (atMostK(arr, n, k) - atMostK(arr, n, k - 1));
}
 
// Driver code
int main()
{
    int arr[] = { 2, 1, 2, 1, 6 };
    int n = sizeof(arr)/sizeof(arr[0]);
    int k = 2;
 
    cout<<(exactlyK(arr, n, k));
}


Java




// Java implementation of the approach
import java.util.*;
 
public class GfG {
 
    // Function to return the count of subarrays
    // with at most K distinct elements using
    // the sliding window technique
    private static int atMostK(int arr[], int n, int k)
    {
 
        // To store the result
        int count = 0;
 
        // Left boundary of window
        int left = 0;
 
        // Right boundary of window
        int right = 0;
 
        // Map to keep track of number of distinct
        // elements in the current window
        HashMap<Integer, Integer> map = new HashMap<>();
 
        // Loop to calculate the count
        while (right < n) {
 
            // Calculating the frequency of each
            // element in the current window
            map.put(arr[right],
                    map.getOrDefault(arr[right], 0) + 1);
 
            // Shrinking the window from left if the
            // count of distinct elements exceeds K
            while (map.size() > k) {
                map.put(arr[left], map.get(arr[left]) - 1);
                if (map.get(arr[left]) == 0)
                    map.remove(arr[left]);
                left++;
            }
 
            // Adding the count of subarrays with at most
            // K distinct elements in the current window
            count += right - left + 1;
            right++;
        }
        return count;
    }
 
    // Function to return the count of subarrays
    // with exactly K distinct elements
    private static int exactlyK(int arr[], int n, int k)
    {
 
        // Count of subarrays with exactly k distinct
        // elements is equal to the difference of the
        // count of subarrays with at most K distinct
        // elements and the count of subararys with
        // at most (K - 1) distinct elements
        return (atMostK(arr, n, k)
                - atMostK(arr, n, k - 1));
    }
 
    // Driver code
    public static void main(String[] args)
    {
        int arr[] = { 2, 1, 2, 1, 6 };
        int n = arr.length;
        int k = 2;
 
        System.out.print(exactlyK(arr, n, k));
    }
}


Python3




# Python3 implementation of the above approach
 
# Function to return the count of subarrays
# with at most K distinct elements using
# the sliding window technique
 
 
def atMostK(arr, n, k):
 
    # To store the result
    count = 0
 
    # Left boundary of window
    left = 0
 
    # Right boundary of window
    right = 0
 
    # Map to keep track of number of distinct
    # elements in the current window
    map = {}
 
    # Loop to calculate the count
    while(right < n):
 
        if arr[right] not in map:
            map[arr[right]] = 0
 
        # Calculating the frequency of each
        # element in the current window
        map[arr[right]] += 1
 
        # Shrinking the window from left if the
        # count of distinct elements exceeds K
        while(len(map) > k):
 
            if arr[left] not in map:
                map[arr[left]] = 0
 
            map[arr[left]] -= 1
 
            if map[arr[left]] == 0:
                del map[arr[left]]
 
            left += 1
 
        # Adding the count of subarrays with at most
        # K distinct elements in the current window
        count += right - left + 1
        right += 1
 
    return count
 
# Function to return the count of subarrays
# with exactly K distinct elements
 
 
def exactlyK(arr, n, k):
 
    # Count of subarrays with exactly k distinct
    # elements is equal to the difference of the
    # count of subarrays with at most K distinct
    # elements and the count of subararys with
    # at most (K - 1) distinct elements
    return (atMostK(arr, n, k) -
            atMostK(arr, n, k - 1))
 
 
# Driver code
if __name__ == "__main__":
    arr = [2, 1, 2, 1, 6]
    n = len(arr)
    k = 2
 
    print(exactlyK(arr, n, k))
 
# This code is contributed by AnkitRai01


C#




// C# implementation of the approach
using System;
using System.Collections.Generic;
 
class GfG {
 
    // Function to return the count of subarrays
    // with at most K distinct elements using
    // the sliding window technique
    private static int atMostK(int[] arr, int n, int k)
    {
 
        // To store the result
        int count = 0;
 
        // Left boundary of window
        int left = 0;
 
        // Right boundary of window
        int right = 0;
 
        // Map to keep track of number of distinct
        // elements in the current window
        Dictionary<int, int> map
            = new Dictionary<int, int>();
 
        // Loop to calculate the count
        while (right < n) {
 
            // Calculating the frequency of each
            // element in the current window
            if (map.ContainsKey(arr[right]))
                map[arr[right]] = map[arr[right]] + 1;
            else
                map.Add(arr[right], 1);
 
            // Shrinking the window from left if the
            // count of distinct elements exceeds K
            while (map.Count > k) {
                if (map.ContainsKey(arr[left])) {
                    map[arr[left]] = map[arr[left]] - 1;
                    if (map[arr[left]] == 0)
                        map.Remove(arr[left]);
                }
                left++;
            }
 
            // Adding the count of subarrays with at most
            // K distinct elements in the current window
            count += right - left + 1;
            right++;
        }
        return count;
    }
 
    // Function to return the count of subarrays
    // with exactly K distinct elements
    private static int exactlyK(int[] arr, int n, int k)
    {
 
        // Count of subarrays with exactly k distinct
        // elements is equal to the difference of the
        // count of subarrays with at most K distinct
        // elements and the count of subararys with
        // at most (K - 1) distinct elements
        return (atMostK(arr, n, k)
                - atMostK(arr, n, k - 1));
    }
 
    // Driver code
    public static void Main(String[] args)
    {
        int[] arr = { 2, 1, 2, 1, 6 };
        int n = arr.Length;
        int k = 2;
 
        Console.Write(exactlyK(arr, n, k));
    }
}
 
// This code is contributed by 29AjayKumar


Javascript




<script>
 
// Javascript implementation of the approach
 
// Function to return the count of subarrays
// with at most K distinct elements using
// the sliding window technique
function atMostK(arr, n, k)
{
    // To store the result
    let count = 0;
 
    // Left boundary of window
    let left = 0;
 
    // Right boundary of window
    let right = 0;
 
    // Map to keep track of number of distinct
    // elements in the current window
    let map = new Map();
 
    // Loop to calculate the count
    while (right < n)
    {
         
        // Calculating the frequency of each
        // element in the current window
        if (map.has(arr[right]))
            map.set(arr[right],
            map.get(arr[right]) + 1);
        else
            map.set(arr[right], 1);
 
        // Shrinking the window from left if the
        // count of distinct elements exceeds K
        while (map.size > k)
        {
            map.set(arr[left], map.get(arr[left]) - 1);
            if (map.get(arr[left]) == 0)
                map.delete(arr[left]);
                 
            left++;
        }
 
        // Adding the count of subarrays with at most
        // K distinct elements in the current window
        count += right - left + 1;
        right++;
    }
    return count;
}
 
// Function to return the count of subarrays
// with exactly K distinct elements
function exactlyK(arr, n, k)
{
     
    // Count of subarrays with exactly k distinct
    // elements is equal to the difference of the
    // count of subarrays with at most K distinct
    // elements and the count of subararys with
    // at most (K - 1) distinct elements
    return (atMostK(arr, n, k) -
            atMostK(arr, n, k - 1));
}
 
// Driver code
let arr = [ 2, 1, 2, 1, 6 ];
let n = arr.length;
let k = 2;
 
document.write(exactlyK(arr, n, k));
 
// This code is contributed by avanitrachhadiya2155
 
</script>


Output

7

Time Complexity: O(N) 
Space Complexity: O(N)

Another Approach: When you move the right cursor, keep tracking whether we have reach a count of K distinct integers, if yes, we process left cursor, here is how we process left cursor:

  • check whether the element pointed by the left cursor is duplicated in the window, if yes, we remove it, and use a variable (e.g. prefix) to record that we have removed an element from the window). keep this process until we reduce the window size from to exactly K. now we can calculate the number of the valid good array as res += prefix;
  • after process left cursor and all the stuff, the outer loop will continue and the right cursor will move forward, and then the window size will exceed K, we can simply drop the leftmost element of the window and reset prefix to 0. and continue on. 
     

 Below is the implementation of the above approach: 

C++




// C++ program to calculate number
// of subarrays with distinct elements of size k
#include <bits/stdc++.h>
#include <map>
#include <vector>
using namespace std;
 
int subarraysWithKDistinct(vector<int>& A, int K)
{
   
    // declare a map for the frequency
    unordered_map<int, int> mapp;
    int begin = 0, end = 0, prefix = 0, cnt = 0;
    int res = 0;
   
    // traverse the array
    while (end < A.size())
    {
        // increase the frequency
        mapp[A[end]]++;
        if (mapp[A[end]] == 1) {
            cnt++;
        }
        end++;
        if (cnt > K)
        {
            mapp[A[begin]]--;
            begin++;
            cnt--;
            prefix = 0;
        }
       
        // loop until mapp[A[begin]] > 1
        while (mapp[A[begin]] > 1)
        {
            mapp[A[begin]]--;
            begin++;
            prefix++;
        }
        if (cnt == K)
        {
            res += prefix + 1;
        }
    }
   
    // return the final count
    return res;
}
// Driver code
int main()
{
    vector<int> arr{ 2, 1, 2, 1, 6 };
    int k = 2;
 
     // Function call
    cout << (subarraysWithKDistinct(arr, k));
}
// This code is contributed by Harman Singh


Java




// Java program to calculate number
// of subarrays with distinct elements of size k
import java.util.*;
class GFG
{
  static int subarraysWithKDistinct(int A[], int K)
  {
 
    // declare a map for the frequency
    HashMap<Integer, Integer> mapp = new HashMap<>();
    int begin = 0, end = 0, prefix = 0, cnt = 0;
    int res = 0;
 
    // traverse the array
    while (end < A.length)
    {
 
      // increase the frequency
      if(mapp.containsKey(A[end]))
      {
        mapp.put(A[end], mapp.get(A[end]) + 1);
      }
      else
      {
        mapp.put(A[end], 1);
      }
      if (mapp.get(A[end]) == 1)
      {
        cnt++;
      }
      end++;
      if (cnt > K)
      {
        if(mapp.containsKey(A[begin]))
        {
          mapp.put(A[begin], mapp.get(A[begin]) - 1);
        }
        else
        {
          mapp.put(A[begin], -1);
        }
        begin++;
        cnt--;
        prefix = 0;
      }
 
      // loop until mapp[A[begin]] > 1
      while (mapp.get(A[begin]) > 1)
      {
        if(mapp.containsKey(A[begin]))
        {
          mapp.put(A[begin], mapp.get(A[begin]) - 1);
        }
        else
        {
          mapp.put(A[begin], -1);
        }
        begin++;
        prefix++;
      }
      if (cnt == K)
      {
        res += prefix + 1;
      }
    }
 
    // return the final count
    return res;
  }
 
  // Driver code
  public static void main(String[] args)
  {
    int arr[] = { 2, 1, 2, 1, 6 };
    int k = 2;
 
    // Function call
    System.out.println(subarraysWithKDistinct(arr, k));
  }
}
 
// This code is contributed by divyeshrabadiya07


Python3




# Python3 program to calculate number of
# subarrays with distinct elements of size k
def subarraysWithKDistinct(A, K):
     
    # Declare a map for the frequency
    mapp = {}
    begin, end, prefix, cnt = 0, 0, 0, 0
    res = 0
     
    # Traverse the array
    while (end < len(A)):
         
        # Increase the frequency
        mapp[A[end]] = mapp.get(A[end], 0) + 1
         
        if (mapp[A[end]] == 1):
            cnt += 1
 
        end += 1
         
        if (cnt > K):
            mapp[A[begin]] -= 1
            begin += 1
            cnt -= 1
            prefix = 0
 
        # Loop until mapp[A[begin]] > 1
        while (mapp[A[begin]] > 1):
            mapp[A[begin]] -= 1
            begin += 1
            prefix += 1
 
        if (cnt == K):
            res += prefix + 1
 
    # Return the final count
    return res
 
# Driver code
if __name__ == '__main__':
     
    arr = [ 2, 1, 2, 1, 6 ]
    k = 2
     
    # Function call
    print (subarraysWithKDistinct(arr, k))
     
# This code is contributed by Mohit kumar


C#




// C# program to calculate number
// of subarrays with distinct elements of size k
using System;
using System.Collections.Generic;
class GFG {
     
    static int subarraysWithKDistinct(List<int> A, int K)
    {
        
        // declare a map for the frequency
        Dictionary<int, int> mapp = new Dictionary<int, int>(); 
        int begin = 0, end = 0, prefix = 0, cnt = 0;
        int res = 0;
        
        // traverse the array
        while (end < A.Count)
        {
           
            // increase the frequency
            if(mapp.ContainsKey(A[end]))
            {
                mapp[A[end]]++;
            }
            else{
                mapp[A[end]] = 1;
            }
            if (mapp[A[end]] == 1) {
                cnt++;
            }
            end++;
            if (cnt > K)
            {
                if(mapp.ContainsKey(A[begin]))
                {
                    mapp[A[begin]]--;
                }
                else{
                    mapp[A[begin]] = -1;
                }
                begin++;
                cnt--;
                prefix = 0;
            }
            
            // loop until mapp[A[begin]] > 1
            while (mapp[A[begin]] > 1)
            {
                mapp[A[begin]]--;
                begin++;
                prefix++;
            }
            if (cnt == K)
            {
                res += prefix + 1;
            }
        }
        
        // return the final count
        return res;
    }
 
  // Driver code
  static void Main()
  {
    List<int> arr = new List<int>(new int[] { 2, 1, 2, 1, 6 });
    int k = 2;
  
     // Function call
    Console.Write(subarraysWithKDistinct(arr, k));
  }
}
 
// This code is contributed by divyesh072019


Javascript




<script>
 
// Javascript program to calculate number
// of subarrays with distinct elements of size k
function subarraysWithKDistinct(A, K)
{
     
    // Declare a map for the frequency
    let mapp = new Map();
    let begin = 0, end = 0, prefix = 0, cnt = 0;
    let res = 0;
  
    // Traverse the array
    while (end < A.length)
    {
      
        // increase the frequency
        if (mapp.has(A[end]))
        {
            mapp.set(A[end],
            mapp.get(A[end]) + 1);
        }
        else
        {
            mapp.set(A[end], 1);
        }
        if (mapp.get(A[end]) == 1)
        {
            cnt++;
        }
        end++;
        if (cnt > K)
        {
            if (mapp.has(A[begin]))
            {
                mapp.set(A[begin],
                mapp.get(A[begin]) - 1);
            }
            else
            {
                mapp.set(A[begin], -1);
            }
            begin++;
            cnt--;
            prefix = 0;
        }
     
        // loop until mapp[A[begin]] > 1
        while (mapp.get(A[begin]) > 1)
        {
            if(mapp.has(A[begin]))
            {
                mapp.set(A[begin],
                mapp.get(A[begin]) - 1);
            }
            else
            {
                mapp.set(A[begin], -1);
            }
            begin++;
            prefix++;
        }
        if (cnt == K)
        {
            res += prefix + 1;
        }
    }
     
    // Return the final count
    return res;
}
 
// Driver code
let arr = [ 2, 1, 2, 1, 6 ];
let k = 2;
 
// Function call
document.write(subarraysWithKDistinct(arr, k));
 
// This code is contributed by rag2127
 
</script>


Output

7

Time Complexity: O(N)
Auxiliary Space: O(N)

Optimized Sliding window :

Approach :

Iterate the array and perform these steps :
 
1. Just count the number of distinct numbers with each iteration.
2. If equals k then check the subarrays which can be formed with the elements between i and j.
3. If greater than k, then move i pointer with decresing number of elements in array and count too.

Then return the sum of subarrays.  

Java




/*package whatever //do not write package name here */
 
import java.io.*;
 
class GFG {
      public static int subarraysWithKDistinct(int[] nums, int k) {
        int n = nums.length;
 
        int i = 0;
        int j = 0;
        int count = 0;
        int ans = 0;
        int []arr = new int[n + 5];
        while(j < n){
            arr[nums[j]]++;
            if(arr[nums[j]] == 1){
                count++;
            }
 
            while(count > k){
                arr[nums[i]]--;
                if(arr[nums[i]] == 0){
                    count--;
                }
                i++;
            }
 
            if(count == k){
                int val = i;
                while(count == k){
                    ans++;
 
                    int num = nums[val];
                    arr[num]--;
                    if(arr[num] == 0){
                        count--;
                    }
                    val++;
                }
 
                val--;
                while(val >= i){
                    int num = nums[val];
                    arr[num]++;
                    if(arr[num] == 1){
                        count++;
                    }
                    val--;
                }
            }
            j++;
        }
 
        return ans;
    }
    public static void main (String[] args) {
        int arr[] = { 2, 1, 2, 1, 6 };
        int k = 2;
  
        // Function call
        System.out.println(subarraysWithKDistinct(arr, k));
    }
}


Python3




class GFG:
    def subarraysWithKDistinct(nums, k):
        n = len(nums)
        i = 0
        j = 0
        count = 0
        ans = 0
        arr = [0]*(n+5)
        while(j < n):
            arr[nums[j]] += 1
            if(arr[nums[j]] == 1):
                count += 1
            while(count > k):
                arr[nums[i]] -= 1
                if(arr[nums[i]] == 0):
                    count -= 1
                i += 1
            if(count == k):
                val = i
                while(count == k):
                    ans += 1
                    num = nums[val]
                    arr[num] -= 1
                    if(arr[num] == 0):
                        count -= 1
                    val += 1
                val -= 1
                while(val >= i):
                    num = nums[val]
                    arr[num] += 1
                    if(arr[num] == 1):
                        count += 1
                    val -= 1
            j += 1
        return ans
 
# Test the code
arr = [2, 1, 2, 1, 6]
k = 2
print(GFG.subarraysWithKDistinct(arr, k))


C++




#include <bits/stdc++.h>
using namespace std;
 
int subarraysWithKDistinct(int nums[], int n, int k) {
    int i = 0, j = 0, count = 0, ans = 0;
    int arr[n + 5] = {0};
 
    while(j < n) {
        arr[nums[j]]++;
        if(arr[nums[j]] == 1)
            count++;
 
        while(count > k) {
            arr[nums[i]]--;
            if(arr[nums[i]] == 0)
                count--;
            i++;
        }
 
        if(count == k) {
            int val = i;
            while(count == k) {
                ans++;
                int num = nums[val];
                arr[num]--;
                if(arr[num] == 0)
                    count--;
                val++;
            }
 
            val--;
            while(val >= i) {
                int num = nums[val];
                arr[num]++;
                if(arr[num] == 1)
                    count++;
                val--;
            }
        }
        j++;
    }
 
    return ans;
}
 
int main() {
    int arr[] = {2, 1, 2, 1, 6};
    int n = sizeof(arr) / sizeof(arr[0]);
    int k = 2;
     
    // Function call
    cout << subarraysWithKDistinct(arr, n, k) << endl;
 
    return 0;
}


C#




using System;
 
public class GFG {
    public static int SubarraysWithKDistinct(int[] nums, int k) {
        int n = nums.Length;
 
        int i = 0;
        int j = 0;
        int count = 0;
        int ans = 0;
        int[] arr = new int[n + 5];
        while (j < n) {
            arr[nums[j]]++;
            if (arr[nums[j]] == 1) {
                count++;
            }
 
            while (count > k) {
                arr[nums[i]]--;
                if (arr[nums[i]] == 0) {
                    count--;
                }
                i++;
            }
 
            if (count == k) {
                int val = i;
                while (count == k) {
                    ans++;
 
                    int num = nums[val];
                    arr[num]--;
                    if (arr[num] == 0) {
                        count--;
                    }
                    val++;
                }
 
                val--;
                while (val >= i) {
                    int num = nums[val];
                    arr[num]++;
                    if (arr[num] == 1) {
                        count++;
                    }
                    val--;
                }
            }
            j++;
        }
 
        return ans;
    }
 
    public static void Main(string[] args) {
        int[] arr = { 2, 1, 2, 1, 6 };
        int k = 2;
 
        // Function call
        Console.WriteLine(SubarraysWithKDistinct(arr, k));
    }
}


Javascript




function subarraysWithKDistinct(nums, k) {
    const n = nums.length;
    let i = 0;
    let j = 0;
    let count = 0;
    let ans = 0;
    const arr = new Array(n + 5).fill(0);
     
    while(j < n) {
        arr[nums[j]]++;
        if(arr[nums[j]] == 1) {
            count++;
        }
         
        while(count > k) {
            arr[nums[i]]--;
            if(arr[nums[i]] == 0) {
                count--;
            }
            i++;
        }
         
        if(count == k) {
            let val = i;
            while(count == k) {
                ans++;
                const num = nums[val];
                arr[num]--;
                if(arr[num] == 0) {
                    count--;
                }
                val++;
            }
             
            val--;
            while(val >= i) {
                const num = nums[val];
                arr[num]++;
                if(arr[num] == 1) {
                    count++;
                }
                val--;
            }
        }
        j++;
    }
     
    return ans;
}
 
const arr = [2, 1, 2, 1, 6];
const k = 2;
console.log(subarraysWithKDistinct(arr, k));


Output

7

Time Complexity : O(N)
Auxiliary Space : O(N)



Last Updated : 04 Apr, 2023
Like Article
Save Article
Previous
Next
Share your thoughts in the comments
Similar Reads