NS_Generator_Mixer.py

import os

# დასამატებელია
# რიცხვების მიწერა თავში ან ბოლოში
# წლების მიწერა თავში ან ბოლოში

# დუბლიკატების მოშორება 
def remove_duplicates(input_file, output_file):
    with open(input_file, 'r', encoding='utf-8') as infile:
        lines = infile.readlines()
    
    unique_lines = set()
    
    with open(output_file, 'w', encoding='utf-8') as outfile:
        for line in lines:
            if line not in unique_lines:
                outfile.write(line)
                unique_lines.add(line)

# დაფორმატება saxeli Saxeli SAXELI
def upper_lower_Case(input_file, output_file):
    with open(input_file, 'r', encoding='utf-8') as infile:
        lines = infile.readlines()
    
    # აქ შეგიძლია დაამატო სხვადასხვა ვარიანტი
    lowercase_lines = [line.lower() for line in lines]
    first_letter_uppercase_lines = [line.capitalize() for line in lines]
    uppercase_lines = [line.upper() for line in lines]
    
    # output ში ჩაწერა
    with open(output_file, 'w', encoding='utf-8') as outfile:
        outfile.writelines(lowercase_lines)
        outfile.writelines(first_letter_uppercase_lines)
        outfile.writelines(uppercase_lines)

# დაფორმატება giorgi -> g!orgi giorg! g!org! 
####################################################################
def replace_first_occurrence(word, letter, symbol):
    return word.replace(letter, symbol, 1)

def replace_second_occurrence(word, letter, symbol):
    parts = word.split(letter, 2)
    if len(parts) == 3:
        return letter.join(parts[:2]) + symbol + parts[2]
    return word

def replace_all_occurrences(word, letter, symbol):
    return word.replace(letter, symbol)

def process_words(input_file, output_file, letter, symbol):
    with open(input_file, 'r', encoding='utf-8') as infile:
        words = [line.strip() for line in infile]
    
    with open(output_file, 'a', encoding='utf-8') as outfile:
        for word in words:
            first_replacement = replace_first_occurrence(word, letter, symbol)
            outfile.write(first_replacement + '\n')

            second_replacement = replace_second_occurrence(word, letter, symbol)
            outfile.write(second_replacement + '\n')

            all_replacement = replace_all_occurrences(word, letter, symbol)
            outfile.write(all_replacement + '\n')

# სახელებისა და გვარების შერევა 
def generate_name_surname_combinations(first, second, output_file):
    # სახელების წაკითხვა 
    with open(first, 'r', encoding='utf-8') as infile:
        names = [line.strip() for line in infile]
    
    # გვარების წაკითხვა/ Read Surnames
    with open(second, 'r', encoding='utf-8') as infile:
        surnames = [line.strip() for line in infile]
    
    # აქ შეგიძლია დაამატო კომბინაციები 
    combination1 = [f"{name}{surname}" for name in names for surname in surnames]
    combination2 = [f"{name}_{surname}" for name in names for surname in surnames]
    combination3 = [f"{name}-{surname}" for name in names for surname in surnames]
    combination4 = [f"{name}.{surname}" for name in names for surname in surnames]
    combination5 = [f"{name}/{surname}" for name in names for surname in surnames]
    combination6 = [f"{name}\{surname}" for name in names for surname in surnames]
    combination7 = [f"{name[0]}.{surname}" for name in names for surname in surnames]
    combination8 = [f"{name[0]}_{surname}" for name in names for surname in surnames]
    combination9 = [f"{name[0]}-{surname}" for name in names for surname in surnames]
    combination10 = [f"{name[0]}/{surname}" for name in names for surname in surnames]
    combination11 = [f"{name[0]}\{surname}" for name in names for surname in surnames]
    combination12 = [f"{name[0]}_{surname}" for name in names for surname in surnames]
    combination13 = [f"{name[0]}{surname}" for name in names for surname in surnames]
    combination14 = [f"{name}da{surname}" for name in names for surname in surnames]
    

    with open(output_file, 'w', encoding='utf-8') as outfile:
        outfile.write("\n".join(combination1) + "\n")
        outfile.write("\n".join(combination2) + "\n")
        outfile.write("\n".join(combination3) + "\n")
        outfile.write("\n".join(combination4) + "\n")
        outfile.write("\n".join(combination5) + "\n")
        outfile.write("\n".join(combination6) + "\n")
        outfile.write("\n".join(combination7) + "\n")
        outfile.write("\n".join(combination8) + "\n")
        outfile.write("\n".join(combination9) + "\n")
        outfile.write("\n".join(combination10) + "\n")
        outfile.write("\n".join(combination11) + "\n")
        outfile.write("\n".join(combination12) + "\n")
        outfile.write("\n".join(combination13) + "\n")
        outfile.write("\n".join(combination14) + "\n")


# წაშლის 8 ზე ნაკლებ ასოიან სიტყვებს
def remove_short_words(input_file, output_file, min_length=8):
    with open(input_file, 'r', encoding='utf-8') as infile:
        lines = infile.readlines()

    filtered_lines = [line for line in lines if len(line.strip()) >= min_length]

    with open(output_file, 'w', encoding='utf-8') as outfile:
        outfile.writelines(filtered_lines)

# ამატებს პირველი კობინაციების ფაილს მეორე კომბინაციების ფაილს 
def append_file_data(file1, file2, output_file):
    with open(file1, 'r', encoding='utf-8') as infile1:
        lines1 = infile1.readlines()
    
    with open(file2, 'r', encoding='utf-8') as infile2:
        lines2 = infile2.readlines()
    
    combined_lines = lines1 + lines2
    
    with open(output_file, 'w', encoding='utf-8') as outfile:
        outfile.writelines(combined_lines)



                                            # ფუნქციების გამოძახების ნაწილი

# დუბლიკატების მოშორება უნიკალური სახელებიდან და გვარებიდან
input_file = r'Surnames\Surnames.txt'
output_file = r'Surnames\Unique_Surnames.txt'
remove_duplicates(input_file, output_file)

input_file = r'Names\Names.txt'
output_file = r'Names\Unique_Names.txt'
remove_duplicates(input_file, output_file)


# დაფორმატება saxeli Saxeli SAXELI
input_file = r'Surnames\Unique_Surnames.txt'
output_file = r'Surnames\Unique_Surnames.txt'
upper_lower_Case(input_file, output_file)

input_file = r'Names\Unique_Names.txt'
output_file = r'Names\Unique_Names.txt'
upper_lower_Case(input_file, output_file)


# აქ შეგიძლია დაამატო კიდევ რა ასოები გინდა რომ შეიცვალოს სხვადასხვა სიმბოლოთი
# პირველად წერ ასოს რომელიც გინდა შეიცვალოს და მეორედ სიმბოლოს რომლითაც გინდა რომ შეიცვალოს
input_file = r'Names/Unique_Names.txt'   
output_file = r'Names/Unique_Names.txt'
process_words(input_file, output_file, 'i', '!')
process_words(input_file, output_file, 'e', '3')
process_words(input_file, output_file, 'o', '0')

input_file = r'Surnames/Unique_Surnames.txt'   
output_file = r'Surnames/Unique_Surnames.txt'
process_words(input_file, output_file, 'i', '!')
process_words(input_file, output_file, 'e', '3')
process_words(input_file, output_file, 'o', '0')
####################################################################


# დუბლიკატების მეორედ მოშორება
input_file = r'Surnames\Unique_Surnames.txt'
output_file = r'Surnames\Unique_Surnames.txt'
remove_duplicates(input_file, output_file)

input_file = r'Names\Unique_Names.txt'
output_file = r'Names\Unique_Names.txt'
remove_duplicates(input_file, output_file)


# სახელების და გვარების შერევა
first = r'Names\Unique_Names.txt'
second = r'Surnames\Unique_Surnames.txt'
output_file = r'combinations.txt'
generate_name_surname_combinations(first, second, output_file)

first = r'Surnames\Unique_Surnames.txt'
second = r'Names\Unique_Names.txt'
output_file = r'combinations1.txt'
generate_name_surname_combinations(first, second, output_file)

# შლის 8 ზე ნაკლებ ასოიან სიტყვებს
input_file = r'combinations.txt'
output_file = r'filtered_combinations.txt'
remove_short_words(input_file, output_file)

input_file = r'combinations1.txt'
output_file = r'filtered_combinations1.txt'
remove_short_words(input_file, output_file)

# ყველა კომბინაციიდან ქმნის ერთ საბოლოო ფაილს
file1 = r'filtered_combinations.txt'
file2 = r'filtered_combinations1.txt'
output_file = r'FullWordlist.txt'
append_file_data(file1, file2, output_file)


# დროებითი ფაილების წაშლა
def remove_temp_files():
    os.remove(r'Names/Unique_Names.txt')
    os.remove(r'Surnames/Unique_Surnames.txt')
    os.remove(r'combinations.txt')
    os.remove(r'combinations1.txt')
    os.remove(r'filtered_combinations.txt')
    os.remove(r'filtered_combinations1.txt')
# ეს შეგიძლია დააკომენტარო რათა დროებითი ფაილები არ წაიშალოს
remove_temp_files()