kscanne · b-sai · Feb 12, 2023 · Feb 12, 2023 · Feb 12, 2023 · Feb 15, 2023
diff --git a/S23/b-sai/main.py b/S23/b-sai/main.py
@@ -0,0 +1,50 @@
+
+def to_lowercase(word: str, language: str) -> str:
+    """Lowercase `word` using the casing rules of `language` (a BCP 47 tag).
+
+    Beyond str.lower(): tr/az map I -> ı and İ -> i; gd/gv/ga hyphenate a
+    lowercase n/t prefix before an uppercase vowel (nAthair -> n-athair);
+    el turns a string-final Σ into ς.  Returns the lowercased string.
+    """
+    tag = language.lower().replace("_", "-")  # BCP 47 tags are case-insensitive
+    if tag.startswith(("zh", "th", "ja")):
+        return word.lower()
+    # Match the primary subtag so region/script variants (tr-TR, az-Latn) count.
+    is_turkic = tag.split("-")[0] in ("tr", "az")
+    is_gaelic = tag.startswith(("gd", "gv", "ga"))
+    is_greek = tag.startswith("el")
+    pieces = []
+    for idx, letter in enumerate(word):
+        lower_letter = letter.lower()
+        if is_turkic:
+            if letter == "I":
+                lower_letter = "ı"
+            elif letter == "\u0130":  # İ: plain lower() yields "i" + U+0307
+                lower_letter = "i"
+        elif is_gaelic:
+            # Hyphenate only a 2nd-position vowel after n/t that is followed by
+            # another character which is not a combining tilde (U+0303).
+            if (idx == 1 and letter in "AEIOUÁÉÍÓÚ" and word[0] in "nt"
+                    and idx + 1 < len(word) and ord(word[idx + 1]) != 771):
+                lower_letter = "-" + lower_letter
+        elif is_greek and letter == "Σ" and idx == len(word) - 1:
+            lower_letter = "ς"
+        pieces.append(lower_letter)
+    return "".join(pieces)
+
+
+# Self-test: every non-blank line of tests.tsv is "word<TAB>language<TAB>expected".
+with open("tests.tsv", "r", encoding="utf-8") as f:
+    # Skip blank lines; they would break the three-way unpack in the loop below.
+    tests = [line for line in f.read().splitlines() if line.strip()]
+num_correct = 0
+for test in tests:
+    word, language, actual = test.split("\t")  # `actual` holds the expected output
+    predicted = to_lowercase(word, language)
+    if predicted != actual:
+        print(f"COuldn't convert {word} in {language}!")
+        print(f"Actual: {actual}")
+        print(f"Predicted: {predicted}")
+    else:
+        num_correct += 1
+print(f"Successfully completed {num_correct}/{len(tests)} tests")
diff --git a/S23/b-sai/readme.md b/S23/b-sai/readme.md
@@ -0,0 +1,5 @@
+### b-sai lowercase converter
+
+This is a simple tool that converts uppercase letters to lowercase letters in text in any language.
+
+To run the Python script, simply run `python3 main.py` from the S23/b-sai/ directory.
diff --git a/S23/b-sai/tests.tsv b/S23/b-sai/tests.tsv
@@ -16,3 +16,10 @@ KASIM	en	kasim
 ΠΌΛΗΣ	el	πόλης
 官话	zh-Hans	官话
 ภาษาไทย	th	ภาษาไทย
+車	ja	車
+うさぎ	ja	うさぎ
+ลา	th	ลา
+ลิง	th	ลิง
+ΚΑΘΙΣΤΕ	el	καθιστε
+comPuTer_**#science	en	computer_**#science
+tACKY	en	tacky