AliMustapha committed on
Commit
9ec8f41
·
1 Parent(s): 84a5643
Files changed (1) hide show
  1. utils/data_utils.py +4 -1
utils/data_utils.py CHANGED
@@ -1,8 +1,11 @@
 
 
 
1
  from unidecode import unidecode
2
  import pandas as od
3
  import regex
4
  import unicodedata
5
-
6
  def is_most_common_char(s):
7
  max_count = len(s) * 0.90 # calculate the maximum count of a single character
8
  char_count = {} # create an empty dictionary to store character counts
 
1
+ __copyright__ = "Copyright (C) 2023 Ali Mustapha"
2
+ __license__ = "GPL-3.0-or-later"
3
+
4
  from unidecode import unidecode
5
  import pandas as od
6
  import regex
7
  import unicodedata
8
+ import re
9
  def is_most_common_char(s):
10
  max_count = len(s) * 0.90 # calculate the maximum count of a single character
11
  char_count = {} # create an empty dictionary to store character counts