# Constrained-Text-Generation-Studio.py

import random
import re
import string
import time as time
from collections import Counter
import numpy as np

import dearpygui.dearpygui as dpg
import fasttext
import pronouncing
import torch
from huggingface_hub import hf_hub_download
from scipy import spatial
from torch.nn import functional as F
from transformers import (AutoModelForCausalLM, AutoModelForQuestionAnswering,
                          AutoModelForSeq2SeqLM,
                          AutoModelForSequenceClassification, AutoTokenizer,
                          GPT2Tokenizer, LogitsProcessor, LogitsProcessorList,
                          pipeline, top_k_top_p_filtering)
from screeninfo import get_monitors

##TODO: Allow more semantic, phonetic, lexical models (Maybe allow specification of fasttext weights, dropdown select some phonetic models)
##TODO: Loading Bars when loading model, and when generating text
##TODO: Allow the user to decide to regenerate new predictions with a right click?
##TODO: Button for loading Masked Language Models, and then displaying the tokenizer masking character, enabling the user to right click and to tab
##TODO: Proper layout somehow
##TODO: "novelty generation constraints" like pilish (specify list of word lengths) or pangram/perfect pangram generation

# Wall-clock timestamp captured when the module starts executing.
starttime = time.time()

# fastText embedding model obtained through hf_hub_download; semantic_matching()
# queries it for word vectors.
fasttext_model = fasttext.load_model(hf_hub_download("osanseviero/fasttext_embedding", "model.bin"))


# Placeholders only: load_model() rebinds both names to real objects.
tokenizer = ""
model = ""

def add_and_load_image(image_path, parent=None):
    """Load an image file as a static texture and add an image item for it.

    The image item is attached to ``parent`` when one is given; otherwise
    ``dpg.add_image`` is called without an explicit parent. Returns whatever
    ``dpg.add_image`` returns.
    """
    width, height, _channels, pixels = dpg.load_image(image_path)

    with dpg.texture_registry() as registry:
        texture = dpg.add_static_texture(width, height, pixels, parent=registry)

    placement = {} if parent is None else {"parent": parent}
    return dpg.add_image(texture, **placement)

def _help(message):
    """Put a "(?)" marker next to the most recently created item.

    The last item is moved into a new horizontal group, the next created item
    is captured into the same group, and a tooltip showing ``message`` is
    attached to the marker text.
    """
    target = dpg.last_item()
    row = dpg.add_group(horizontal=True)
    dpg.move_item(target, parent=row)

    def _move_into_row(item):
        dpg.move_item(item, parent=row)

    dpg.capture_next_item(_move_into_row)
    marker = dpg.add_text("(?)", color=[0, 255, 0])
    with dpg.tooltip(marker):
        dpg.add_text(message)

def load_model(the_name):
    """Load a tokenizer and causal LM into the module-level globals.

    When ``the_name`` is the literal "load_model" the model name is read from
    the "model_name" widget; otherwise ``the_name`` itself is used. The
    "percision" widget value selects 8-bit loading, float16 weights, or the
    library default. A status line is then added to "load_model_window".
    """
    global tokenizer
    global model

    model_name = dpg.get_value("model_name") if the_name == "load_model" else the_name
    tokenizer = AutoTokenizer.from_pretrained(model_name)

    precision = dpg.get_value("percision")
    if precision == "8bit":
        precision_kwargs = {"load_in_8bit": True}
    elif precision == "16bit":
        precision_kwargs = {"load_in_8bit": False, "torch_dtype": torch.float16}
    else:
        precision_kwargs = {"load_in_8bit": False}
    model = AutoModelForCausalLM.from_pretrained(model_name, device_map='auto', **precision_kwargs)

    # The status text reports CUDA availability, not where the weights ended up.
    if torch.cuda.is_available():
        device_clause = " Loaded Succesfully onto the GPU"
    else:
        device_clause = " Loaded Succesfully onto the CPU"
    loaded_model_string = model_name + device_clause + " with " + dpg.get_value("percision") + " percision"
    dpg.add_text(parent="load_model_window", default_value=loaded_model_string)



########--------------------------------------------------------------#### Filters ########--------------------------------------------------------------####

def all_letters_included(word, string_list):
    """Return True when every entry of ``string_list`` occurs in ``word[0]``.

    ``word`` is indexed with ``[0]`` to get the candidate text.
    """
    text = word[0]
    for required in string_list:
        if required not in text:
            return False
    return True


def any_letters_included(word, string_list):
    """Return True when at least one character of ``word[0]`` is an entry of ``string_list``.

    Matching is per character, so multi-character entries never match.
    """
    for character in word[0]:
        if character in string_list:
            return True
    return False

def all_letters_not_included(word, string_list):
    """Return True when none of the entries of ``string_list`` occurs in ``word[0]``."""
    text = word[0]
    for banned in string_list:
        if banned in text:
            return False
    return True

def any_letters_not_included(word, string_list):
    """Return True when at least one entry of ``string_list`` is absent from ``word[0]``.

    This is the weak counterpart of ``all_letters_not_included``: a candidate
    is rejected only when it contains every listed string, e.g. with
    ["b", "t"] only words containing both "b" and "t" are rejected.

    The previous implementation iterated over the characters of the word and
    tested them against the list, so any word with a single unlisted
    character passed, including words that contained all banned strings.
    """
    text = word[0]
    return any(banned not in text for banned in string_list)

def equal_to_length(word, word_length):
    """Return True when ``word[0]`` has exactly ``word_length`` characters."""
    candidate_length = len(word[0])
    return candidate_length == word_length


def greater_than_length(word, word_length):
    """Return True when ``word[0]`` is strictly longer than ``word_length``."""
    candidate_length = len(word[0])
    return candidate_length > word_length

def less_than_length(word, word_length):
    """Return True when ``word[0]`` is strictly shorter than ``word_length``."""
    candidate_length = len(word[0])
    return candidate_length < word_length

def ends_with(word, ending_string,  start = None, end = None):
    """Return ``word[0].endswith(ending_string, start, end)``.

    ``start`` and ``end`` are passed straight through to ``str.endswith``.
    """
    text = word[0]
    return text.endswith(ending_string, start, end)

def starts_with(word, starting_string, start = None, end = None):
    """Return ``word[0].startswith(starting_string, start, end)``.

    ``start`` and ``end`` are passed straight through to ``str.startswith``.
    """
    text = word[0]
    return text.startswith(starting_string, start, end)

def string_in_position(word, a_string_list, position_index_list):
    """Return True when each expected string equals the character at its paired index.

    ``a_string_list[i]`` is compared with ``word[0][position_index_list[i]]``.
    Returns False on the first mismatch, when an index is out of range or not
    usable as an index, or when there are fewer indices than strings.
    """
    text = word[0]
    # A missing index can never be satisfied, so fail before comparing.
    if len(position_index_list) < len(a_string_list):
        return False
    for expected, position in zip(a_string_list, position_index_list):
        try:
            actual = text[position]
        except (IndexError, TypeError):
            # Only lookup failures mean "no match"; a bare except would also
            # swallow KeyboardInterrupt and SystemExit.
            return False
        if actual != expected:
            return False
    return True

def phonetic_matching(word, phonetic_matching_string):
    """Return True when ``word[0]`` and the reference string get the same ``pe.encode`` result."""
    candidate_code = pe.encode(word[0])
    reference_code = pe.encode(phonetic_matching_string)
    return bool(candidate_code == reference_code)

def string_edit(word, string_edit_string, string_edit_threshold):
    """Return True when ``cmp.dist_abs`` between ``word[0]`` and the reference is at most the threshold."""
    distance = cmp.dist_abs(word[0], string_edit_string)
    return bool(distance <= string_edit_threshold)



def semantic_matching(word, semantic_string, semantic_threshold):
    """Return True when the cosine similarity of the two fastText vectors reaches the threshold.

    Similarity is computed as ``1 - cosine distance`` between the vector of
    ``word[0]`` and the vector of ``semantic_string``.
    """
    candidate_vector = fasttext_model.get_word_vector(word[0])
    reference_vector = fasttext_model.get_word_vector(semantic_string)
    cosine_distance = spatial.distance.cosine(candidate_vector, reference_vector)
    return bool(1 - cosine_distance >= semantic_threshold)


def rhyme(word, rhyme_string):
    """Return True when ``word[0]`` is among ``pronouncing.rhymes(rhyme_string)``."""
    rhyming_words = pronouncing.rhymes(rhyme_string)
    return bool(word[0] in rhyming_words)


def meter(word, meter_string):
    """Return True when ``word[0]`` has the same stress pattern as ``meter_string``.

    Only the first pronunciation returned by ``pronouncing.phones_for_word``
    is used for each side. Returns False when either string has no
    pronunciation; previously a reference word without one raised IndexError
    on ``phones_list[0]``.
    """
    reference_phones = pronouncing.phones_for_word(meter_string)
    if not reference_phones:
        return False
    candidate_phones = pronouncing.phones_for_word(word[0])
    if not candidate_phones:
        return False
    reference_stress = pronouncing.stresses(reference_phones[0])
    candidate_stress = pronouncing.stresses(candidate_phones[0])
    return candidate_stress == reference_stress

def syllable(word, syllable_number):
    """Return True when the first pronunciation of ``word[0]`` has ``syllable_number`` syllables.

    Returns False when ``pronouncing.phones_for_word`` gives no pronunciation.
    """
    pronunciations = pronouncing.phones_for_word(word[0])
    if len(pronunciations) == 0:
        return False
    return bool(pronouncing.syllable_count(pronunciations[0]) == syllable_number)




def palindrome(word):
    """Return True when ``word[0]`` reads the same forwards and backwards."""
    text = word[0]
    mirrored = "".join(reversed(text))
    return text == mirrored

def partial_anagram(word, a_string):
    """Return True when ``word[0]`` can be spelled from the characters of ``a_string``.

    Unlike a full anagram, not every character of ``a_string`` has to be used.
    """
    available = Counter(a_string)
    needed = Counter(word[0])
    return all(available[character] >= amount for character, amount in needed.items())

def full_anagram(word, a_string):
    """Return True when ``word[0]`` uses exactly the same characters as ``a_string``, with the same counts."""
    return sorted(word[0]) == sorted(a_string)

def isogram(word, count = 1):
    """Return True when no character occurs more than ``count`` times in ``word[0]``."""
    text = word[0]
    return all(text.count(character) <= count for character in text)

def reverse_isogram(word, count = 1):
    """Return True when every character of ``word[0]`` occurs at least ``count`` times in it."""
    text = word[0]
    return all(text.count(character) >= count for character in text)


"""

Ideas 

1. Longest repeating and non overlapping substring in a string
2. List of strings to consume from, like a pangram but you specify the alphabet
3. Edit Distance of strings, user supplies string and max distance and it returns strings with that distance. I think this is fast enough to calculate for this to work!

Leetcode stuff like this

Find longest palindromic substring
def countSubstrings(self, s: str) -> int:
        @cache
        def isPalindrome(i, j):
            return i >= j or s[i] == s[j] and isPalindrome(i + 1, j - 1)
        return sum(isPalindrome(i, j) for i in range(len(s)) for j in range(i, len(s)))

"""

########--------------------------------------------------------------####          ########--------------------------------------------------------------####


# Module-level constraint state. The load_*_callback functions rebind these
# globals and get_next_word_without_e() reads them when filtering candidates.
# A falsy value ([], "", 0, False) leaves the corresponding filter disabled.

# Lipogram family: strings that must not / must appear in a candidate.
lipogram_naughty_word_list = []
weak_lipogram_naughty_word_list = []
reverse_lipogram_nice_word_list = []
weak_reverse_lipogram_nice_word_list = []
# Parallel lists consumed by string_in_position(): expected strings and their indices.
string_in_positon_list = []
string_in_positon_index_list = []
# Prefix / suffix constraints.
starts_with_string = ""
ends_with_string = ""
# Reference strings and thresholds for the phonetic, semantic and edit-distance filters.
phonetic_matching_string = ""
semantic_matching_string = ""
semantic_distance_threshold = 0.0
string_edit_string = ""
string_edit_distnace_threhold = 0
# Pronunciation-based constraints (syllable count, stress pattern, rhyme).
syllable_number = 0
meter_string = ""
rhyme_string = ""
# Length constraints: exact, strictly greater than, strictly less than.
constrained_length = 0
constrained_gt_length = 0
constrained_lt_length = 0
palindrome_enabled = False
anagram_string = ""
partial_anagram_string = ""
# The isogram filters run only when their count is at least 1.
isogram_count = 0
reverse_isogram_count = 0



def _read_transform_flags():
    """Read every output-transform toggle once and return them as {tag: value}."""
    transform_tags = (
        "upper_case_transform",
        "lower_case_transform",
        "replace_spaces",
        "lstrip_transform",
        "rstrip_transform",
        "strip_transform",
        "capitalize_first_letter_transform",
        "alpha_numaric_transform",
        "alpha_transform",
        "digit_transform",
        "ascii_transform",
    )
    return {tag: dpg.get_value(tag) for tag in transform_tags}


def _apply_transforms(text, flags):
    """Apply the enabled output transforms to one decoded token, in a fixed order."""
    if flags["upper_case_transform"]:
        text = text.upper()
    if flags["lower_case_transform"]:
        text = text.lower()
    if flags["replace_spaces"]:
        text = text.replace(' ', '')
    if flags["lstrip_transform"]:
        text = text.lstrip()
    if flags["rstrip_transform"]:
        text = text.rstrip()
    if flags["strip_transform"]:
        text = text.strip()
    if flags["capitalize_first_letter_transform"]:
        text = text.capitalize()
    if flags["alpha_numaric_transform"]:
        text = ''.join(ch for ch in text if ch.isalnum())
    if flags["alpha_transform"]:
        text = ''.join(ch for ch in text if ch.isalpha())
    if flags["digit_transform"]:
        text = ''.join(ch for ch in text if ch.isdigit())
    if flags["ascii_transform"]:
        text = ''.join(ch for ch in text if ch.isascii())
    return text


def _passes_active_constraints(word):
    """Return a truthy value when ``word`` satisfies every constraint that is currently set.

    Each clause is skipped when its module-level setting is falsy (or, for
    the isogram filters, below 1).
    """
    return (
        (not lipogram_naughty_word_list or all_letters_not_included(word=word, string_list=lipogram_naughty_word_list)) and
        (not weak_lipogram_naughty_word_list or any_letters_not_included(word=word, string_list=weak_lipogram_naughty_word_list)) and
        (not reverse_lipogram_nice_word_list or all_letters_included(word=word, string_list=reverse_lipogram_nice_word_list)) and
        (not weak_reverse_lipogram_nice_word_list or any_letters_included(word=word, string_list=weak_reverse_lipogram_nice_word_list)) and
        (not string_in_positon_list or string_in_position(word=word, a_string_list=string_in_positon_list, position_index_list=string_in_positon_index_list)) and
        (not starts_with_string or starts_with(word=word, starting_string=starts_with_string)) and
        (not ends_with_string or ends_with(word=word, ending_string=ends_with_string)) and
        (not constrained_length or equal_to_length(word=word, word_length=constrained_length)) and
        (not constrained_gt_length or greater_than_length(word=word, word_length=constrained_gt_length)) and
        (not constrained_lt_length or less_than_length(word=word, word_length=constrained_lt_length)) and
        (not palindrome_enabled or palindrome(word=word)) and
        (not phonetic_matching_string or phonetic_matching(word=word, phonetic_matching_string=phonetic_matching_string)) and
        (not semantic_matching_string or semantic_matching(word=word, semantic_string=semantic_matching_string, semantic_threshold=semantic_distance_threshold)) and
        (not anagram_string or full_anagram(word=word, a_string=anagram_string)) and
        (not partial_anagram_string or partial_anagram(word=word, a_string=partial_anagram_string)) and
        (not rhyme_string or rhyme(word=word, rhyme_string=rhyme_string)) and
        (not meter_string or meter(word=word, meter_string=meter_string)) and
        (not string_edit_string or string_edit(word=word, string_edit_string=string_edit_string, string_edit_threshold=string_edit_distnace_threhold)) and
        (not syllable_number or syllable(word=word, syllable_number=syllable_number)) and
        (isogram_count < 1 or isogram(word=word, count=isogram_count)) and
        (reverse_isogram_count < 1 or reverse_isogram(word=word, count=reverse_isogram_count))
    )


def get_next_word_without_e(sequence):
    """Return the next-token candidates for ``sequence`` that satisfy the active constraints.

    Despite the name, every configured constraint is applied, not only a
    lipogram on "e". The result is a list of ``(text, probability)`` tuples
    ordered by descending probability, where ``text`` is the decoded token
    after the enabled output transforms.

    Steps:
      1. Run the model and take the logits at the last position.
      2. Apply the "temperature", "top_k" and "top_p" widget values.
      3. Softmax, sort descending, decode every token id.
      4. Apply the output transforms, optionally dropping blank results.
      5. Keep the candidates that pass every active constraint.

    NOTE(review): tokens removed by top-k/top-p appear to stay in the result
    with probability 0.0 rather than being dropped; confirm whether callers
    rely on that.
    """
    with torch.no_grad():
        input_ids = tokenizer.encode(sequence, return_tensors="pt")
        # Logits for the position following the last input token.
        next_token_logits = model(input_ids)[0][:, -1, :]

        temperature = dpg.get_value("temperature")
        if temperature != 1.0:
            next_token_logits = next_token_logits / temperature

        # Only pass the options that are switched on (> 0) so the library
        # defaults apply to the other one.
        top_p = dpg.get_value("top_p")
        top_k = dpg.get_value("top_k")
        filtering_options = {}
        if top_k > 0:
            filtering_options["top_k"] = top_k
        if top_p > 0:
            filtering_options["top_p"] = top_p
        if filtering_options:
            next_token_logits = top_k_top_p_filtering(next_token_logits, **filtering_options)

        sorted_probabilities, sorted_token_ids = F.softmax(next_token_logits.float(), dim=-1).sort(descending=True)
        decoded_tokens = tokenizer.batch_decode(sorted_token_ids[0])
        # One bulk conversion instead of an .item() call per vocabulary entry.
        probabilities = sorted_probabilities[0].tolist()

    # The toggles do not depend on the token, so read them once, not per token.
    transform_flags = _read_transform_flags()
    drop_blank_outputs = dpg.get_value("filter_blank_outputs")

    word_list = []
    for decoded_token, probability in zip(decoded_tokens, probabilities):
        text = _apply_transforms(decoded_token, transform_flags)
        if drop_blank_outputs and text == "":
            continue
        word_list.append((text, probability))

    return [word for word in word_list if _passes_active_constraints(word)]


def tab_key_generate_tokens_callback():
    """Append one generated token to the "input_string" widget.

    With "greedy_decoding" enabled the most probable surviving candidate is
    used; otherwise one candidate is sampled in proportion to its
    probability. The text is left unchanged when no candidate survives the
    filters, or when sampling is requested and all surviving candidates have
    zero probability. Both cases previously raised an exception.
    """
    string_input = dpg.get_value("input_string")
    generated_output = get_next_word_without_e(string_input)
    if not generated_output:
        return
    if dpg.get_value("greedy_decoding"):
        returned_word = generated_output[0][0]
    else:
        probability_weights = [probability for _, probability in generated_output]
        # random.choices cannot sample when the weights sum to zero.
        if sum(probability_weights) <= 0:
            return
        returned_word = random.choices(generated_output, weights=probability_weights, k=1)[0][0]
    string_input += returned_word
    dpg.set_value("input_string", string_input)

def generate_tokens_callback():
    """Append up to "num_tokens_to_generate" tokens to the "input_string" widget.

    Each step picks the top candidate when "greedy_decoding" is enabled, or
    samples one by normalized probability otherwise. The widget is updated
    after every token. Generation stops early when no candidate survives the
    filters, or when sampling is requested and the surviving probabilities
    sum to zero. Both cases previously raised an exception.
    """
    number_of_tokens = dpg.get_value("num_tokens_to_generate")
    greedy_decoding = dpg.get_value("greedy_decoding")
    string_input = dpg.get_value("input_string")

    for _ in range(number_of_tokens):
        generated_output = get_next_word_without_e(string_input)
        if not generated_output:
            break

        if greedy_decoding:
            returned_word = generated_output[0][0]
        else:
            words, probabilities = zip(*generated_output)
            total_probability = np.sum(probabilities)
            # Dividing by a zero total would give NaN probabilities.
            if total_probability <= 0:
                break
            probabilities_normalized = np.array(probabilities) / total_probability
            returned_word = np.random.choice(words, p=probabilities_normalized)

        # np.random.choice returns a NumPy string scalar; keep the text a plain str.
        string_input += str(returned_word)
        dpg.set_value("input_string", string_input)

def add_generated_word_callback(sender, app_data, user_data):
    """Append ``str(user_data)`` to the "input_string" widget and rebuild the suggestions popup."""
    extended_text = dpg.get_value("input_string") + str(user_data)
    dpg.set_value("input_string", extended_text)
    edit_string_callback()

def edit_string_callback():
    """Build a popup on "input_string" listing the current next-token candidates.

    Each candidate becomes a selectable whose callback appends the candidate
    text to the input. When no candidate passes the filters a single
    explanatory line is shown instead.
    """
    candidates = get_next_word_without_e(dpg.get_value("input_string"))
    with dpg.popup(parent = "input_string"):
        dpg.add_text("Options")
        dpg.add_separator()
        if not candidates:
            dpg.add_text("No results with the current filters")
        else:
            for candidate in candidates:
                # The label is the whole (text, probability) tuple; only the text is appended.
                dpg.add_selectable(label=candidate, user_data = candidate[0], callback = add_generated_word_callback)

def typed_calledback(sender, app_data, user_data):
    """Copy the callback's ``app_data``, as a string, into "pretty_input_string"."""
    typed_text = str(app_data)
    dpg.set_value("pretty_input_string", typed_text)

def lipogram_callback(sender, app_data, user_data):
    """Show "Lipogram Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Lipogram Options")

def load_naughty_strings_callback():
    """Load the lipogram (forbidden strings) list from "lipogram_word_list" and refresh suggestions.

    The input is split on whitespace. The first application adds an "applied"
    marker and a summary line; later applications update the summary line.
    """
    global lipogram_naughty_word_list
    string_input = dpg.get_value("lipogram_word_list")
    # split() without a separator drops empty entries. split(" ") yielded ""
    # for empty or double-spaced input, and "" is a substring of every
    # string, so every candidate was rejected.
    lipogram_naughty_word_list = string_input.split()
    if not dpg.get_value("naughty_applied"):
        dpg.add_text(tag = "naughty_applied", default_value= "Naughty Strings Applied!", parent = "Lipogram Options")
        dpg.add_text(tag = "naughty_filter" , default_value = "Naughty Strings Filter: " + string_input, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "naughty_filter", value = "Naughty Strings Filter: " + string_input)
    edit_string_callback()

def weak_lipogram_callback(sender, app_data, user_data):
    """Show "Weak Lipogram Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Weak Lipogram Options")

def load_weak_naughty_strings_callback():
    """Load the weak lipogram list from "weak_lipogram_word_list" and refresh suggestions.

    The input is split on whitespace. The first application adds an "applied"
    marker and a summary line; later applications update the summary line.
    """
    global weak_lipogram_naughty_word_list
    string_input = dpg.get_value("weak_lipogram_word_list")
    # split() without a separator drops empty entries, so empty input
    # disables the filter instead of leaving a [""] list behind.
    weak_lipogram_naughty_word_list = string_input.split()
    if not dpg.get_value("weak_naughty_applied"):
        dpg.add_text(tag = "weak_naughty_applied", default_value= "Weak Naughty Strings Applied!", parent = "Weak Lipogram Options")
        dpg.add_text(tag = "weak_naughty_filter" , default_value = "Weak Naughty Strings Filter: " + string_input, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "weak_naughty_filter", value = "Weak Naughty Strings Filter: " + string_input)
    edit_string_callback()

def reverse_lipogram_callback(sender, app_data, user_data):
    """Show "Reverse Lipogram Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Reverse Lipogram Options")

def load_reverse_naughty_strings_callback():
    """Load the reverse lipogram (required strings) list from "reverse_lipogram_word_list".

    The input is split on whitespace. The first application adds an "applied"
    marker and a summary line; later applications update the summary line.
    Suggestions are refreshed afterwards.
    """
    global reverse_lipogram_nice_word_list
    string_input = dpg.get_value("reverse_lipogram_word_list")
    # split() without a separator ignores repeated or other whitespace and
    # returns [] for empty input, which leaves the filter disabled.
    reverse_lipogram_nice_word_list = string_input.split()
    if not dpg.get_value("reverse_nice_applied"):
        dpg.add_text(tag = "reverse_nice_applied", default_value= "Nice Strings Applied!", parent = "Reverse Lipogram Options")
        dpg.add_text(tag = "reverse_nice_filter" , default_value = "Nice Strings Filter: " + string_input, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "reverse_nice_filter", value = "Nice Strings Filter: " + string_input)
    edit_string_callback()

def weak_reverse_lipogram_callback(sender, app_data, user_data):
    """Show "Weak Reverse Lipogram Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Weak Reverse Lipogram Options")

def load_weak_reverse_naughty_strings_callback():
    """Load the weak reverse lipogram list from "weak_reverse_lipogram_word_list".

    The input is split on whitespace. The first application adds an "applied"
    marker and a summary line; later applications update the summary line.
    Suggestions are refreshed afterwards.
    """
    global weak_reverse_lipogram_nice_word_list
    string_input = dpg.get_value("weak_reverse_lipogram_word_list")
    # split(" ") turned empty input into [""], which enables the filter but
    # can never match a character, so every candidate was rejected.
    weak_reverse_lipogram_nice_word_list = string_input.split()
    if not dpg.get_value("weak_reverse_nice_applied"):
        dpg.add_text(tag = "weak_reverse_nice_applied", default_value= "Weak Nice Strings Applied!", parent = "Weak Reverse Lipogram Options")
        dpg.add_text(tag = "weak_reverse_nice_filter" , default_value = "Weak Nice Strings Filter: " + string_input, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "weak_reverse_nice_filter", value = "Weak Nice Strings Filter: " + string_input)
    edit_string_callback()

def string_position_callback(sender, app_data, user_data):
    """Show "Letter Position Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Letter Position Options")

def load_string_positon_callback():
    """Load the string-in-position constraint from its two input widgets.

    "string_for_position" holds whitespace-separated strings and
    "string_position_int" holds the matching whitespace-separated integer
    indices. Raises ValueError when an index is not an integer; the stored
    constraint is then left as it was.
    """
    global string_in_positon_list
    global string_in_positon_index_list
    string_input = dpg.get_value("string_for_position")
    int_input = dpg.get_value("string_position_int")
    # Parse both inputs before touching the globals: previously a bad index
    # raised only after the index global had been overwritten with strings.
    # split() without a separator also drops empty entries, which int()
    # cannot parse.
    parsed_strings = string_input.split()
    parsed_indices = [int(index_text) for index_text in int_input.split()]
    string_in_positon_list = parsed_strings
    string_in_positon_index_list = parsed_indices
    if not dpg.get_value("string_postion_applied"):
        dpg.add_text(tag = "string_postion_applied", default_value= "Strings in Position Applied!", parent = "Letter Position Options")
        dpg.add_text(tag = "string_postion_filter" , default_value = "Strings in Position Applied:  " + string_input + " " + str(int_input), parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "string_postion_filter", value = "Strings in Position Filter: " + string_input + " " + str(int_input))
    edit_string_callback()



def string_starts_with_callback(sender, app_data, user_data):
    """Show "Starting String Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Starting String Options")

def load_string_starts_with_callback():
    """Store the required prefix from "string_start_word" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global starts_with_string
    starts_with_string = dpg.get_value("string_start_word")
    if dpg.get_value("string_starts_with_applied"):
        dpg.set_value(
            item="string_starts_with_filter",
            value="Starting String Filter: " + starts_with_string,
        )
    else:
        dpg.add_text(
            tag="string_starts_with_applied",
            default_value="Starting String Applied!",
            parent="Starting String Options",
        )
        dpg.add_text(
            tag="string_starts_with_filter",
            default_value="Starting String Applied!  " + starts_with_string,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def string_ends_with_callback(sender, app_data, user_data):
    """Show "Ending String Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Ending String Options")

def load_string_ends_with_callback():
    """Store the required suffix from "string_end_word" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global ends_with_string
    ends_with_string = dpg.get_value("string_end_word")
    if dpg.get_value("string_ends_with_applied"):
        dpg.set_value(
            item="string_ends_with_filter",
            value="Ending String Filter: " + ends_with_string,
        )
    else:
        dpg.add_text(
            tag="string_ends_with_applied",
            default_value="Ending String Applied!",
            parent="Ending String Options",
        )
        dpg.add_text(
            tag="string_ends_with_filter",
            default_value="Ending String Applied!  " + ends_with_string,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def string_length_constrained_callback(sender, app_data, user_data):
    """Show "Length Constrained Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Length Constrained Options")

def load_string_length_constrained_callback():
    """Store the exact-length constraint from "length_constrained_number" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global constrained_length
    constrained_length = dpg.get_value("length_constrained_number")
    length_text = str(constrained_length)
    if dpg.get_value("string_length_constrained_applied"):
        dpg.set_value(
            item="string_length_constrained_filter",
            value="String Length Constraint Filter: " + length_text,
        )
    else:
        dpg.add_text(
            tag="string_length_constrained_applied",
            default_value="String Length Constraint Applied!",
            parent="Length Constrained Options",
        )
        dpg.add_text(
            tag="string_length_constrained_filter",
            default_value="String Length Constraint Applied!  " + length_text,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def string_length_gt_constrained_callback(sender, app_data, user_data):
    """Show "Length Greater Than Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Length Greater Than Options")

def load_string_length_gt_constrained_callback():
    """Store the greater-than length constraint from "length_gt_constrained_number" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global constrained_gt_length
    constrained_gt_length = dpg.get_value("length_gt_constrained_number")
    length_text = str(constrained_gt_length)
    if dpg.get_value("string_length_gt_constrained_applied"):
        dpg.set_value(
            item="string_length_gt_constrained_filter",
            value="String Length Greater Than Constraint Filter: " + length_text,
        )
    else:
        dpg.add_text(
            tag="string_length_gt_constrained_applied",
            default_value="String Length Greater Than Constraint Applied!",
            parent="Length Greater Than Options",
        )
        dpg.add_text(
            tag="string_length_gt_constrained_filter",
            default_value="String Length Greater Than Constraint Applied!  " + length_text,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()


def string_length_lt_constrained_callback(sender, app_data, user_data):
    """Show "Length Lesser Than Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Length Lesser Than Options")

def load_string_length_lt_constrained_callback():
    """Store the less-than length constraint from "length_lt_constrained_number" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global constrained_lt_length
    constrained_lt_length = dpg.get_value("length_lt_constrained_number")
    length_text = str(constrained_lt_length)
    if dpg.get_value("string_length_lt_constrained_applied"):
        dpg.set_value(
            item="string_length_lt_constrained_filter",
            value="String Length Lesser Than Constraint Filter: " + length_text,
        )
    else:
        dpg.add_text(
            tag="string_length_lt_constrained_applied",
            default_value="String Length Lesser Than Constraint Applied!",
            parent="Length Lesser Than Options",
        )
        dpg.add_text(
            tag="string_length_lt_constrained_filter",
            default_value="String Length Lesser Than Constraint Applied!  " + length_text,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()


def phonetic_callback(sender, app_data, user_data):
    """Show "Phonetic Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Phonetic Options")

def load_phonetic_callback():
    """Store the phonetic reference word from "phonetic_word" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global phonetic_matching_string
    phonetic_matching_string = dpg.get_value("phonetic_word")
    if dpg.get_value("phonetic_applied"):
        dpg.set_value(
            item="phonetic_filter",
            value="Phonetic Constraint Filter: " + phonetic_matching_string,
        )
    else:
        dpg.add_text(
            tag="phonetic_applied",
            default_value="Phonetic Constraint Applied!",
            parent="Phonetic Options",
        )
        dpg.add_text(
            tag="phonetic_filter",
            default_value="Phonetic Constraint Applied!  " + phonetic_matching_string,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def semantic_callback(sender, app_data, user_data):
    """Show "Semantic Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Semantic Options")

def load_semantic_callback():
    """Store the semantic reference word and minimum similarity, then refresh suggestions.

    Values come from the "semantic_word" and "semantic_distance" widgets. The
    summary line is created on first use and updated afterwards. The updated
    text now includes the threshold, which was previously shown only the
    first time.
    """
    global semantic_matching_string
    global semantic_distance_threshold
    semantic_matching_string = dpg.get_value("semantic_word")
    semantic_distance_threshold = dpg.get_value("semantic_distance")
    semantic_distance_threshold_string = str(semantic_distance_threshold)
    if not dpg.get_value("semantic_applied"):
        dpg.add_text(tag = "semantic_applied", default_value= "Semantic Constraint Applied!", parent = "Semantic Options")
        dpg.add_text(tag = "semantic_filter" , default_value = "Semantic Constraint Applied!  " + semantic_matching_string + " Minimum Similarity: " + semantic_distance_threshold_string, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "semantic_filter", value = "Semantic Constraint Filter: " + semantic_matching_string + " Minimum Similarity: " + semantic_distance_threshold_string)
    edit_string_callback()


def string_edit_callback(sender, app_data, user_data):
    """Show "String Edit Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("String Edit Options")

def load_string_edit_callback():
    """Store the edit-distance reference string and threshold, then refresh suggestions.

    Values come from the "string_edit_word" and "string_edit_distance"
    widgets. The summary line is created on first use and updated afterwards.

    The threshold is an upper bound on distance (string_edit() keeps
    candidates whose distance is <= the threshold), so the summary is
    labelled "Maximum Distance" instead of "Minimum Similarity". The updated
    text now includes the threshold as well.
    """
    global string_edit_string
    global string_edit_distnace_threhold
    string_edit_string = dpg.get_value("string_edit_word")
    string_edit_distnace_threhold = dpg.get_value("string_edit_distance")
    string_edit_distnace_threhold_string = str(string_edit_distnace_threhold)
    if not dpg.get_value("string_edit_applied"):
        dpg.add_text(tag = "string_edit_applied", default_value= "String Edit Constraint Applied!", parent = "String Edit Options")
        dpg.add_text(tag = "string_edit_filter" , default_value = "String Constraint Applied!  " + string_edit_string + " Maximum Distance: " + string_edit_distnace_threhold_string, parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "string_edit_filter", value = "String Constraint Filter: " + string_edit_string + " Maximum Distance: " + string_edit_distnace_threhold_string)
    edit_string_callback()

def syllable_callback(sender, app_data, user_data):
    """Show "Syllable Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Syllable Options")

def load_syllable_callback():
    """Store the required syllable count from the "syllable_number" widget and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global syllable_number
    syllable_number = dpg.get_value("syllable_number")
    count_text = str(syllable_number)
    if dpg.get_value("syllable_applied"):
        dpg.set_value(
            item="syllable_filter",
            value="Syllable Constraint Filter: " + count_text,
        )
    else:
        dpg.add_text(
            tag="syllable_applied",
            default_value="Syllable Constraint Applied!",
            parent="Syllable Options",
        )
        dpg.add_text(
            tag="syllable_filter",
            default_value="Syllable Constraint Applied!  " + count_text,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def meter_callback(sender, app_data, user_data):
    """Show "Meter Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Meter Options")

def load_meter_callback():
    """Store the meter reference word from "meter_word" and refresh suggestions.

    The summary line is created on first use and updated afterwards.
    """
    global meter_string
    meter_string = dpg.get_value("meter_word")
    if dpg.get_value("meter_applied"):
        dpg.set_value(
            item="meter_filter",
            value="Meter Constraint Filter: " + meter_string,
        )
    else:
        dpg.add_text(
            tag="meter_applied",
            default_value="Meter Constraint Applied!",
            parent="Meter Options",
        )
        dpg.add_text(
            tag="meter_filter",
            default_value="Meter Constraint Applied!  " + meter_string,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def rhyme_callback(sender, app_data, user_data):
    """Show "Rhyme Options" when ``app_data`` equals True, hide it otherwise."""
    set_visibility = dpg.show_item if app_data == True else dpg.hide_item
    set_visibility("Rhyme Options")

def load_rhyme_callback():
    """Store the rhyme target word and refresh its status labels.

    Copies the "rhyme_word" input into the module-level ``rhyme_string``,
    creates the status labels on first use (when
    ``dpg.get_value("rhyme_applied")`` is falsy) or updates "rhyme_filter"
    otherwise, then recomputes predictions via ``edit_string_callback``.
    """
    global rhyme_string
    rhyme_string = dpg.get_value("rhyme_word")

    if dpg.get_value("rhyme_applied"):
        updated_label = "Rhyme Constraint Filter: " + rhyme_string
        dpg.set_value(item="rhyme_filter", value=updated_label)
    else:
        dpg.add_text(
            tag="rhyme_applied",
            default_value="Rhyme Constraint Applied!",
            parent="Rhyme Options",
        )
        first_label = "Rhyme Constraint Applied!  " + rhyme_string
        dpg.add_text(
            tag="rhyme_filter",
            default_value=first_label,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()



def palindrome_callback(sender, app_data, user_data):
    """Checkbox callback: toggle the palindrome panel and the enabled flag.

    When ``app_data`` equals ``True`` the "Palindrome Options" panel is shown
    and the module-level ``palindrome_enabled`` becomes ``True``; otherwise
    the panel is hidden and the flag becomes ``False``.
    """
    global palindrome_enabled
    checked = app_data == True
    change_visibility = dpg.show_item if checked else dpg.hide_item
    change_visibility("Palindrome Options")
    palindrome_enabled = True if checked else False

def load_palindrome_callback():
    """Activate the palindrome constraint and refresh its status labels.

    Sets the module-level ``palindrome_enabled`` flag to ``True``. The flag is
    otherwise only set by the checkbox callback, so after
    ``turn_filters_off_callback`` cleared it (leaving the checkbox ticked)
    pressing this button would show "applied" labels while the constraint
    stayed off.

    Status labels are created when ``dpg.get_value("palindrome_applied")`` is
    falsy (presumably the label does not exist yet); otherwise the existing
    "palindrome_filter" text is rewritten. Predictions are then recomputed
    through ``edit_string_callback``.
    """
    global palindrome_enabled
    # Pressing the load button must actually switch the constraint on.
    palindrome_enabled = True
    if not dpg.get_value("palindrome_applied"):
        dpg.add_text(tag = "palindrome_applied", default_value= "String Palindromeic Constraint Applied!", parent = "Palindrome Options")
        dpg.add_text(tag = "palindrome_filter" , default_value = "String Palindromeic Constraint Applied!  ",  parent = "main_window", before = "lipogram")
    else:
        dpg.set_value(item = "palindrome_filter", value = "String Palindromeic Constraint Applied! ")
    edit_string_callback()

def anagram_callback(sender, app_data, user_data):
    """Checkbox callback: reveal or hide the "Anagram Options" panel.

    Shown when ``app_data`` equals ``True``, hidden otherwise.
    """
    action = dpg.show_item if app_data == True else dpg.hide_item
    action("Anagram Options")

def load_anagram_callback():
    """Store the anagram source string and refresh its status labels.

    The "anagram_string" input is copied into the module-level
    ``anagram_string``. Labels are added when
    ``dpg.get_value("anagram_applied")`` is falsy, otherwise the
    "anagram_filter" text is updated. Ends with ``edit_string_callback``.
    """
    global anagram_string
    anagram_string = dpg.get_value("anagram_string")

    label_exists = dpg.get_value("anagram_applied")
    if label_exists:
        dpg.set_value(item="anagram_filter", value="Anagram Filter: " + anagram_string)
    else:
        dpg.add_text(
            tag="anagram_applied",
            default_value="Anagram Applied!",
            parent="Anagram Options",
        )
        dpg.add_text(
            tag="anagram_filter",
            default_value="Anagram Applied!  " + anagram_string,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def partial_anagram_callback(sender, app_data, user_data):
    """Checkbox callback: reveal or hide the "Partial Anagram Options" panel.

    Hidden unless ``app_data`` equals ``True``.
    """
    if app_data != True:
        dpg.hide_item("Partial Anagram Options")
        return
    dpg.show_item("Partial Anagram Options")

def load_partial_anagram_callback():
    """Store the partial-anagram source string and refresh its status labels.

    Copies the "partial_anagram_string" input into the module-level
    ``partial_anagram_string``; creates the labels when
    ``dpg.get_value("partial_anagram_applied")`` is falsy or updates
    "partial_anagram_filter" otherwise; then calls ``edit_string_callback``.
    """
    global partial_anagram_string
    partial_anagram_string = dpg.get_value("partial_anagram_string")

    if dpg.get_value("partial_anagram_applied"):
        refreshed = "Partial Anagram Filter: " + partial_anagram_string
        dpg.set_value(item="partial_anagram_filter", value=refreshed)
    else:
        dpg.add_text(
            tag="partial_anagram_applied",
            default_value="Partial Anagram Applied!",
            parent="Partial Anagram Options",
        )
        initial = "Partial Anagram Applied!  " + partial_anagram_string
        dpg.add_text(
            tag="partial_anagram_filter",
            default_value=initial,
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def isogram_callback(sender, app_data, user_data):
    """Checkbox callback: reveal or hide the "Isogram Options" panel.

    The panel visibility mirrors the checkbox value passed in ``app_data``.
    """
    panel = "Isogram Options"
    if app_data == True:
        dpg.show_item(panel)
    else:
        dpg.hide_item(panel)

def load_isogram_callback():
    """Store the isogram repeat limit and refresh its status labels.

    Reads "isogram_number" into the module-level ``isogram_count``. Labels
    are added when ``dpg.get_value("isogram_applied")`` is falsy, otherwise
    "isogram_filter" is updated. Ends with ``edit_string_callback``.
    """
    global isogram_count
    isogram_count = dpg.get_value("isogram_number")
    limit_text = str(isogram_count)

    labels_present = dpg.get_value("isogram_applied")
    if labels_present:
        dpg.set_value(item="isogram_filter", value=f"Isogram Filter: {limit_text}")
    else:
        dpg.add_text(
            tag="isogram_applied",
            default_value="Isogram Applied!",
            parent="Isogram Options",
        )
        dpg.add_text(
            tag="isogram_filter",
            default_value=f"Isogram Applied!  {limit_text}",
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()

def reverse_isogram_callback(sender, app_data, user_data):
    """Checkbox callback: reveal or hide the "Reverse Isogram Options" panel.

    Shown when ``app_data`` equals ``True``, hidden otherwise.
    """
    toggle = dpg.show_item if app_data == True else dpg.hide_item
    toggle("Reverse Isogram Options")

def load_reverse_isogram_callback():
    """Store the reverse-isogram repeat count and refresh its status labels.

    Reads "reverse_isogram_number" into the module-level
    ``reverse_isogram_count``. Labels are added when
    ``dpg.get_value("reverse_isogram_applied")`` is falsy, otherwise
    "reverse_isogram_filter" is updated. Ends with ``edit_string_callback``.
    """
    global reverse_isogram_count
    reverse_isogram_count = dpg.get_value("reverse_isogram_number")
    repeat_text = str(reverse_isogram_count)

    if dpg.get_value("reverse_isogram_applied"):
        dpg.set_value(
            item="reverse_isogram_filter",
            value=f"Reverse Isogram Filter: {repeat_text}",
        )
    else:
        dpg.add_text(
            tag="reverse_isogram_applied",
            default_value="Reverse Isogram Applied!",
            parent="Reverse Isogram Options",
        )
        dpg.add_text(
            tag="reverse_isogram_filter",
            default_value=f"Reverse Isogram Applied!  {repeat_text}",
            parent="main_window",
            before="lipogram",
        )
    edit_string_callback()


def turn_filters_off_callback():
    """Reset every filter setting and remove the filter status labels.

    All module-level filter variables are put back to their empty values,
    each "<name>_applied" / "<name>_filter" text item whose value is truthy
    is deleted, and the predictions are recomputed. The filter checkboxes
    themselves are not modified here.
    """
    global lipogram_naughty_word_list, weak_lipogram_naughty_word_list
    global reverse_lipogram_nice_word_list, weak_reverse_lipogram_nice_word_list
    global string_in_positon_list, string_in_positon_index_list
    global starts_with_string, ends_with_string
    global phonetic_matching_string, semantic_matching_string
    global semantic_distance_threshold
    global constrained_length, constrained_gt_length, constrained_lt_length
    global palindrome_enabled
    global anagram_string, partial_anagram_string
    global isogram_count, reverse_isogram_count
    global string_edit_string, string_edit_distnace_threhold
    global syllable_number, meter_string, rhyme_string

    # List-valued settings: each gets its own fresh list (no aliasing).
    lipogram_naughty_word_list = []
    weak_lipogram_naughty_word_list = []
    reverse_lipogram_nice_word_list = []
    weak_reverse_lipogram_nice_word_list = []
    string_in_positon_list = []
    string_in_positon_index_list = []

    # String-valued settings.
    starts_with_string = ends_with_string = ""
    phonetic_matching_string = semantic_matching_string = ""
    string_edit_string = meter_string = rhyme_string = ""
    anagram_string = partial_anagram_string = ""

    # Numeric settings and flags.
    semantic_distance_threshold = 0.0
    string_edit_distnace_threhold = syllable_number = 0
    constrained_length = constrained_gt_length = constrained_lt_length = 0
    isogram_count = reverse_isogram_count = 0
    palindrome_enabled = False

    # Every filter owns a pair of status labels: "<base>_applied" and "<base>_filter".
    label_bases = (
        "partial_anagram",
        "naughty",
        "weak_naughty",
        "reverse_nice",
        "weak_reverse_nice",
        "string_position",
        "string_starts_with",
        "string_ends_with",
        "string_length_constrained",
        "string_length_gt_constrained",
        "string_length_lt_constrained",
        "phonetic",
        "semantic",
        "string_edit",
        "syllable",
        "meter",
        "rhyme",
        "palindrome",
        "anagram",
        "isogram",
        "reverse_isogram",
    )

    for base in label_bases:
        for suffix in ("_applied", "_filter"):
            label_tag = base + suffix
            if dpg.get_value(label_tag):
                dpg.delete_item(label_tag)

    edit_string_callback()
    #TODO: Finish this


# ---------------------------------------------------------------------------
# DearPyGui start-up: context, viewport sized to the first monitor, docking,
# font, and the default window geometry used by the windows created below.
# ---------------------------------------------------------------------------
dpg.create_context()
# Use the first monitor reported by screeninfo to size the viewport.
monitor = get_monitors()[0]
screen_width = monitor.width
screen_height = monitor.height
dpg.create_viewport(width=screen_width, height=screen_height)
dpg.setup_dearpygui()
dpg.toggle_viewport_fullscreen()

#dpg.configure_app(docking=True, dock_space = True)

dpg.enable_docking(dock_space=True)

with dpg.font_registry():
    # Download font here: https://fonts.google.com/specimen/Open+Sans
    # The font file is loaded by relative path at size 15.
    font = dpg.add_font("OpenSans-VariableFont_wdth,wght.ttf", 15, tag="ttf-font"
    )

dpg.bind_font(font)
# Position of the "Read Me First" window: the centre point of the screen.
readme_pos = ((screen_width) // 2, (screen_height) // 2)
# Default (width, height) of each tool window.
# NOTE(review): `// 2.5` yields a float height -- confirm DearPyGui accepts it.
window_size = (screen_width // 2, screen_height // 2.5)
# Initial positions, indexed by the windows below:
# [0] main window, [1] model settings, [2] filters, [3] text transforms.
window_positions = [
    (0, 0),
    (window_size[0], window_size[1]),
    (window_size[0] * 2, 0),
    (window_size[0], 0),
]


"""
Doesn't work... 

def edited_call(sender, app_data, user_data):
    global starttime
    newtime = time.time()
    if newtime - starttime > 2:
        print(dpg.get_item_)
        print(dpg.get_item_state("input_string"))
        edit_string_callback()
        starttime = newtime
"""



#edit_string_callback("This is an example")


# Main window: holds the editable text box; the other tool windows and the
# generation controls are created inside this same `with` block further down.
with dpg.window(tag="main_window", label="CTGS - Contrained Text Generation Studio", no_close=True, width=window_size[0], height=window_size[1], pos=window_positions[0]) as window:
    dpg.add_text("Main Text Box")
    dpg.add_text("Right Click within the text box for LM recommended continuations with constraints applied!")
    # Multiline input tagged "input_string".
    dpg.add_input_text(tag = "input_string", width = 900, height = 500, multiline=True, default_value = "Type something here!")

    # Model settings window: model name input, a load button wired to
    # `load_model`, and a precision selector (tag "percision").
    with dpg.window(tag="load_model_window", label="Model Settings", no_close=True, width=window_size[0], height=window_size[1], pos=window_positions[1]) as model_window:
        dpg.add_text("Enter the name of the pre-trained model from transformers that we are using for Text Generation")
        _help("Make sure torch.cuda.is_available returns True to get GPU support for your models, which significantly speeds them up!")
        dpg.add_text("This will download a new model, so it may take awhile or even break if the model is too large")
        dpg.add_input_text(tag = "model_name", width = 500, height = 500, default_value="EleutherAI/pythia-1b", label = "Huggingface Model Name")
        dpg.add_button(tag="load_model", label="load_model", callback=load_model)
        _help("If ran from the commnad line, you can see the downloading progress in the terminal. Be patient, it can take awhile to download a model!")
        dpg.add_combo(items=["32bit", "16bit", "8bit"], tag = "percision", label = "Select the model percision", default_value ="32bit")
    # Filters window. Each filter follows the same layout: a checkbox whose
    # callback shows/hides a hidden child window, a help tooltip, and the child
    # window holding the filter's inputs plus a "Load ..." button.
    with dpg.window(tag="Filter Options", label="Filters", show=True, no_close=True, width=window_size[0], height=window_size[1], pos=window_positions[2]) as filter_options:
        dpg.add_text("Select which filters you want to enable")
        dpg.add_text("List of enabled filters: ")
        # The load_* callbacks add their status text with before="lipogram",
        # i.e. relative to the checkbox created on the next line.

        # --- Lipogram: all listed strings banned ---
        dpg.add_checkbox(tag="lipogram", label = "All Strings Banned", callback=lipogram_callback)
        _help("A lipogram is when a particular letter or group of strings is avoided.")
        with dpg.child_window(tag="Lipogram Options", show = False, height = 100, width = 600) as lipogram_selection_window:
            dpg.add_text("Add banned letters or strings seperated by a space!")
            dpg.add_input_text(tag = "lipogram_word_list", width = 500, height = 500, label = "Banned Strings")
            dpg.add_button(tag="lipogram_button", label="Load Banned Strings", callback=load_naughty_strings_callback)
        # --- Weak lipogram: any listed string banned ---
        dpg.add_checkbox(tag="weak_lipogram", label = "Any Strings Banned", callback=weak_lipogram_callback)
        _help("A weak lipogram is when at least one of a particular letter or group of strings is avoided.")
        with dpg.child_window(tag="Weak Lipogram Options", show = False, height = 100, width = 600) as weak_lipogram_selection_window:
            dpg.add_text("Add banned letters or strings seperated by a space!")
            dpg.add_input_text(tag = "weak_lipogram_word_list", width = 500, height = 500, label = "Banned Strings")
            dpg.add_button(tag="weak_lipogram_button", label="Load Banned Strings", callback = load_weak_naughty_strings_callback)
        # --- Reverse lipogram: all listed strings required ---
        dpg.add_checkbox(tag="reverse_lipogram", label = "All Strings Required", callback=reverse_lipogram_callback)
        _help("A reverse lipogram is when a particular letter or group of strings is forced.")
        with dpg.child_window(tag="Reverse Lipogram Options", show = False, height = 100, width = 600) as reverse_lipogram_selection_window:
            dpg.add_text("Add forced letters or strings seperated by a space!")
            dpg.add_input_text(tag = "reverse_lipogram_word_list", width = 500, height = 500, label = "Forced Strings")
            dpg.add_button(tag="reverse_lipogram_button", label="Load Forced Strings", callback = load_reverse_naughty_strings_callback)
        # --- Weak reverse lipogram: any listed string required ---
        dpg.add_checkbox(tag="weak_reverse_lipogram", label = "Any Strings Required", callback=weak_reverse_lipogram_callback)
        _help("A weak reverse lipogram is when at least one of a particular letter or group of strings is forced.")


        with dpg.child_window(tag="Weak Reverse Lipogram Options", show = False, height = 100, width = 600) as weak_reverse_selection_window:
            dpg.add_text("Add forced letters or strings seperated by a space!")
            dpg.add_input_text(tag = "weak_reverse_lipogram_word_list", width = 500, height = 500, label = "Forced Strings")
            dpg.add_button(tag="weak_reverse_lipogram_button", label="Load Forced Strings", callback = load_weak_reverse_naughty_strings_callback)

        # --- String in position ---
        dpg.add_checkbox(tag="string_position", label = "String In Position", callback = string_position_callback)
        _help("This allows one to force a particular letter in a particular position of a string\n" "NOTE: It's recommended to combine this with whitespace stripping")

        with dpg.child_window(tag="Letter Position Options", show = False, height = 130, width = 600) as letter_position_selection_window:
            dpg.add_text("Add the position that you want to force a particular letter to appear at! Give a list of characters seperated by a space")
            dpg.add_input_text(tag = "string_for_position", width = 500, height = 500, label = "List of characters")
            dpg.add_text("Corresponding list of indexes for each character. Must be the same length as the list of characters")
            dpg.add_input_text(tag = "string_position_int", width = 500, height = 500, label = "List of indexes")
            dpg.add_button(tag="string_position_button", label="Load Strings", callback = load_string_positon_callback)

        # --- Starts with ---
        dpg.add_checkbox(tag="string_starts", label = "String Starts With", callback = string_starts_with_callback)
        _help("This allows one to guarantee that the string will start with a particular set of letters")

        with dpg.child_window(tag="Starting String Options", show = False, height = 100, width = 600) as starting_string_selection_window:
            dpg.add_text("Add the string that the word should start with")
            dpg.add_input_text(tag = "string_start_word", width = 500, height = 500, label = "String for word to start with")
            dpg.add_button(tag="string_start_button", label="Load Starting String", callback=load_string_starts_with_callback)

        # --- Ends with ---
        dpg.add_checkbox(tag="string_ends", label = "String Ends With", callback = string_ends_with_callback)
        _help("This allows one to guarantee that the string will end with a particular set of letters")
        with dpg.child_window(tag="Ending String Options", show = False, height = 100, width = 600) as ending_string_selection_window:
            dpg.add_text("Add the string that the word should end with")
            dpg.add_input_text(tag = "string_end_word", width = 500, height = 500, label = "String for word to end with")
            dpg.add_button(tag="string_end_button", label="Load Ending String", callback=load_string_ends_with_callback)

        # --- String edit distance ---
        dpg.add_checkbox(tag="string_edit_distance_check", label = "String Edit Distance Matching", callback = string_edit_callback)
        _help("This uses Levenshtein distance to return all strings with lower edit distance then specified")

        with dpg.child_window(tag="String Edit Options", show = False, height = 100, width = 600) as string_edit_window:
            dpg.add_text("Specify the word you want to string edit distance match against")
            dpg.add_input_text(tag = "string_edit_word", width = 500, height = 500, label = "String to match using Levenshtein distance")
            dpg.add_input_int(tag = "string_edit_distance", label = "Similarity that the word has to be higher than")
            dpg.add_button(tag="string_edit_constrained_button", label="Load String Edit Distance Matching Strings", callback=load_string_edit_callback)

        # --- Length equal to ---
        dpg.add_checkbox(tag="length_constrained", label = "String Length Equal To", callback = string_length_constrained_callback)
        _help("This allows one to guarantee that the string will be of a particular length\n" "NOTE: It's recommended to combine this filter with whitespace stripping")
        with dpg.child_window(tag="Length Constrained Options", show = False, height = 100, width = 600) as length_constrained_selection_window:
            dpg.add_text("Specify the length that you want your strings to be constrained to")
            dpg.add_input_int(tag = "length_constrained_number", label = "Number to constrain the length with")
            dpg.add_button(tag="length_constrained_button", label="Load Length Constrained String", callback=load_string_length_constrained_callback)

        # --- Length greater than ---
        dpg.add_checkbox(tag="length_gt", label = "String Length Greater Than", callback = string_length_gt_constrained_callback)
        _help("This allows one to guarantee that the string will be longar than a particular length\n" "NOTE: It's recommended to combine this filter with whitespace stripping")

        with dpg.child_window(tag="Length Greater Than Options", show = False, height = 100, width = 600) as length_gt_selection_window:
            dpg.add_text("Specify the length that you want your strings to be greater than")
            dpg.add_input_int(tag = "length_gt_constrained_number", label = "Number to constrain the length to be greater than")
            dpg.add_button(tag="length_gt_constrained_button", label="Load Length Constrained String", callback=load_string_length_gt_constrained_callback)

        # --- Length lesser than ---
        dpg.add_checkbox(tag="length_lt", label = "String Length Lesser Than", callback = string_length_lt_constrained_callback)
        _help("This allows one to guarantee that the string will be shorter than particular length\n" "NOTE: It's recommended to combine this filter with whitespace stripping")

        with dpg.child_window(tag="Length Lesser Than Options", show = False, height = 100, width = 600) as length_lt_selection_window:
            dpg.add_text("Specify the length that you want your strings to be lesser than")
            dpg.add_input_int(tag = "length_lt_constrained_number", label = "Number to constrain the length to be lesser than")
            dpg.add_button(tag="length_lt_constrained_button", label="Load Length Constrained String", callback=load_string_length_lt_constrained_callback)


        # --- Phonetic matching ---
        dpg.add_checkbox(tag="phonetic", label = "Phonetic Matching", callback = phonetic_callback)
        _help("This uses the double-metaphone algorithm to phonetically match your string with the passed in string")

        with dpg.child_window(tag="Phonetic Options", show = False, height = 100, width = 600) as phonetic_selection_window:
            dpg.add_text("Specify the word you want to phonetically match against")
            dpg.add_input_text(tag = "phonetic_word", width = 500, height = 500, label = "String to match Phonetically")
            dpg.add_button(tag="phonetic_constrained_button", label="Load Phonetically Matching Strings", callback=load_phonetic_callback)

        # --- Semantic matching ---
        dpg.add_checkbox(tag="semantic", label = "Semantic Matching", callback = semantic_callback)
        _help("This uses fasttext word vectors to return strings which are semantically similar to the provided string")

        with dpg.child_window(tag="Semantic Options", show = False, height = 100, width = 600) as semantic_selection_window:
            dpg.add_text("Specify the word you want to semantically match against")
            dpg.add_input_text(tag = "semantic_word", width = 500, height = 500, label = "String to match Semantically")
            dpg.add_input_float(tag = "semantic_distance", label = "Similarity that the word has to be higher than")
            dpg.add_button(tag="semantic_constrained_button", label="Load Semantic Matching Strings", callback=load_semantic_callback)

        # --- Syllable count ---
        dpg.add_checkbox(tag="syllable", label = "Syllable Count", callback = syllable_callback)
        _help("This will return strings with the specified number of syllables.")

        with dpg.child_window(tag="Syllable Options", show = False, height = 100, width = 600) as syllable_selection_window:
            dpg.add_text("Specify the number of Syllables you want in your word")
            dpg.add_input_int(tag = "syllable_number", label = "Number of Syllables in word")
            dpg.add_button(tag="syllable_constrained_button", label="Load Syllable Constrained Strings", callback=load_syllable_callback)

        # --- Meter (stress pattern) ---
        dpg.add_checkbox(tag="meter", label = "Meter", callback = meter_callback)
        _help("This will return strings with the matching stress pattern of a passed in string, also called meter")

        with dpg.child_window(tag="Meter Options", show = False, height = 100, width = 600) as meter_selection_window:
            dpg.add_text("Specify the word whose meter you want to match")
            dpg.add_input_text(tag = "meter_word", width = 500, height = 500, label = "String to match based on stress pattern")
            dpg.add_button(tag="meter_constrained_button", label="Load Meter Constrained Strings", callback=load_meter_callback)

        # --- Rhyme ---
        dpg.add_checkbox(tag="rhyme", label = "Rhyme", callback = rhyme_callback)
        _help("This will return strings that rhyme with the provided string")

        with dpg.child_window(tag="Rhyme Options", show = False, height = 100, width = 600) as rhyme_selection_window:
            dpg.add_text("Specify the word which you want to rhyme with")
            dpg.add_input_text(tag = "rhyme_word", width = 500, height = 500, label = "String to rhyme against")
            dpg.add_button(tag="rhyme_constrained_button", label="Load Rhyming Constrained Strings", callback=load_rhyme_callback)


        # --- Palindrome (no inputs, only an activation button) ---
        dpg.add_checkbox(tag="palindrome", label = "Palindrome", callback = palindrome_callback)
        _help("A palindrome is a string which reads the same backward as forward, such as madam or racecar")

        with dpg.child_window(tag="Palindrome Options", show = False, height = 100, width = 600) as palindrome_selection_window:
            dpg.add_text("Press the button to force all generated strings to be palindromes!")
            dpg.add_button(tag="palindrome_button_enabled", label="Load Palindromic String", callback=load_palindrome_callback)



        # --- Anagram ---
        dpg.add_checkbox(tag="anagram", label = "Anagram", callback = anagram_callback)
        _help("An anagram is a string formed by rearranging the letters of a different string")
        with dpg.child_window(tag="Anagram Options", show = False, height = 100, width = 600) as anagram_selection_window:
            dpg.add_text("Specify the string that you want generated strings to be anagrams of!")
            dpg.add_input_text(tag = "anagram_string", width = 500, height = 500, label = "Anagram String")
            dpg.add_button(tag="anagram_button", label="Load Anagramic String", callback=load_anagram_callback)

        # --- Partial anagram ---
        dpg.add_checkbox(tag="partial_anagram", label = "Partial Anagram", callback = partial_anagram_callback)
        _help("A partial anagram is a string constructed by rearranging some or all of the letters of a different string")

        with dpg.child_window(tag="Partial Anagram Options", show = False, height = 100, width = 600) as partial_anagram_selection_window:
            dpg.add_text("Specify the string that you want generated strings to be partial anagrams of!")
            dpg.add_input_text(tag = "partial_anagram_string", width = 500, height = 500, label = "Partial Anagram String")
            dpg.add_button(tag="partial_anagram_button", label="Load Partial Anagramic String", callback=load_partial_anagram_callback)

        # --- Isogram ---
        dpg.add_checkbox(tag="isogram", label = "Isogram", callback = isogram_callback)
        _help("An isogram is a string in which none of its characters appear more than the provided number of times")

        with dpg.child_window(tag="Isogram Options", show = False, height = 100, width = 600) as isogram_window:
            dpg.add_text("Specify the number of times characters are allowed to repeat")
            dpg.add_input_int(tag = "isogram_number", label = "Number of times characters can repeat", default_value = 1)
            dpg.add_button(tag="isogram_button", label="Load Isogramic String", callback=load_isogram_callback)

        # --- Reverse isogram ---
        dpg.add_checkbox(tag="reverse_isogram", label = "Reverse Isogram", callback = reverse_isogram_callback)
        _help("A reverse isogram is a string in which all of its characters appear more than the provided number of times")

        with dpg.child_window(tag="Reverse Isogram Options", show = False, height = 100, width = 600) as reverse_isogram_window:
            dpg.add_text("Specify the number of times that characters must repeat")
            dpg.add_input_int(tag = "reverse_isogram_number", label = "Number of times characters must repeat", default_value = 1)
            dpg.add_button(tag="reverse_isogram_button", label="Load Reverse Isogramic String", callback=load_reverse_isogram_callback)

        # Clears all filter state through turn_filters_off_callback.
        dpg.add_button(tag="remove_filters", label = "Reset Filters", callback = turn_filters_off_callback)
    

    # Generation controls, added to the main window below the text box.
    dpg.add_button(label="Predict New Tokens", callback=edit_string_callback)
    dpg.add_button(label="AI generate some tokens", callback=generate_tokens_callback)
    # NOTE(review): "top_p" is an integer input although the help text below
    # describes a probability -- confirm how the consumer of this value uses it.
    dpg.add_input_int(tag = "top_p", label = "Number of tokens for top P sampling", default_value = 0)
    _help("Top-p sampling chooses from the smallest possible set of words whose cumulative probability exceeds the probability p")
    dpg.add_input_int(tag = "top_k", label = "Number of tokens for top K sampling", default_value = 0)
    _help("In Top-K sampling, the K most likely next words are filtered and the probability mass is redistributed among only those K next words.")
    dpg.add_input_float(tag = "temperature", label = "Temperature", default_value = 1.0)
    _help("lowering the so-called temperature increases the likelihood of high probability words and decreasing the likelihood of low probability words. Increasing does the opposite.")
    dpg.add_input_int(tag = "num_tokens_to_generate", label = "Number of tokens to generate", default_value = 20)
    _help("This only impacts how many tokens are generated by the AI generate some tokens button")
    dpg.add_checkbox(tag="greedy_decoding", label = "Enable greedy decoding?")
    _help("This will override top-p and top-k sampling and only select the most likely token everytime")
    
    # Text transforms window: one checkbox per transform, each followed by a
    # help tooltip. The checkboxes have no callbacks; their values are
    # presumably read by tag elsewhere in the file.
    with dpg.window(tag="Transforms", show=True, label="Text Transforms", no_close=True, width=window_size[0], height=window_size[1], pos=window_positions[3]) as pre_filter_options:
        dpg.add_text("These are text transforms which will apply to all tokens *before* the actual filters are applied")
        dpg.add_text("Using these transforms will frequently assist with increasing the vocabulary that is available after a filter is applied")
        dpg.add_text("These transforms can also prevent generation of undesierable characters")
        # Case transforms.
        dpg.add_checkbox(tag="upper_case_transform", label = "Uppercase transform")
        _help("Use this to cause all text to be UPPERCASED LIKE THIS")
        dpg.add_checkbox(tag="lower_case_transform", label = "Lowercase transform")
        _help("Use this to force all tokens to be lowercased like this")
        # Whitespace transforms.
        dpg.add_checkbox(tag="replace_spaces", label = "Remove spaces")
        _help("Use this to force all tokens to not have spaces likethis")
        dpg.add_checkbox(tag = "lstrip_transform", label = "Left side strip")
        _help("Use this to stip spaces from the left of the text")
        dpg.add_checkbox(tag = "rstrip_transform", label = "Right side strip")
        _help("Use this to stip spaces from the right of the text")
        dpg.add_checkbox(tag = "strip_transform", label = "Full strip")
        _help("Use this to stip spaces from both sides of the text")
        dpg.add_checkbox(tag = "capitalize_first_letter_transform", label = "Capitalize the first letter")
        _help("Use this to force all tokens to have their first letter capitalized Like This")
        # Character-class restrictions.
        dpg.add_checkbox(tag = "alpha_numaric_transform", label = "Force tokens to be alpha numaric")
        _help("Use this to force all tokens to be alphanumaric, meaning only using the alphabet or numbers")
        dpg.add_checkbox(tag = "alpha_transform", label = "Force tokens to be alphaic")
        _help("Use this to force all tokens to be alphaic, meaning only using the alphabet")
        dpg.add_checkbox(tag = "digit_transform", label = "Force tokens to be digits")
        _help("Use this to force all tokens to be digits, meaning only using numbers")
        dpg.add_checkbox(tag = "ascii_transform", label = "Force tokens to be ascii characters")
        _help("Use this to force all tokens to be ascii characters - to filter out unicode.")
        dpg.add_checkbox(tag = "filter_blank_outputs", label = "Filter blank outputs")
        _help("After applying some other transforms, there may be leftover blanks. This will remove them")

    # "Read Me First" window: closable usage notes shown at start-up.
    # The first bullet names the model that is actually downloaded by default
    # (EleutherAI/pythia-1b, as used by the model-name input and the start-up
    # load_model call) instead of the stale "distilgpt2" reference.
    with dpg.window(tag="Readme", show=True, label="Read Me First", no_close=False, pos=readme_pos) as read_me_options:
        dpg.add_text(default_value ="Usage tips:")
        dpg.add_text(default_value="The first time you run this, it may take a few minutes to be ready to run because the default model (EleutherAI/pythia-1b) and fasttext are being downloaded from huggingface. Wait until you see a messege in the Model Settings window about it being succesfully loaded before trying to run CTGS.", bullet = True)
        dpg.add_text(default_value ="Right click anywhere within the text box for a list of continuations with the enabled filters to appear", bullet = True)
        dpg.add_text(default_value ="The F1 key generates new tokens given the context (populates the right click continuations box), and is equivilant to the Predict New Tokens button", bullet = True)
        dpg.add_text(default_value ="The F2 key directly inserts the next token into the text box using the models decoder (and top_p, top_k, temperature) settings. It's equivilant to the AI generate some tokens button", bullet = True)
        dpg.add_text(default_value="If you're not seeing continuations using F2 or the ai generate some token button, make sure that it's not generating spaces, line returns, or other blank characters", bullet = True)
        dpg.add_text(default_value="Use the text transforms list to apply transforms to the vocabulary before the constraints are applied. To mitigate the problem of the LM generating spaces, you could for example use the filter blank outputs transform", bullet = True)
        dpg.add_text(default_value="After typing or copying/pasting text into the text box, use the Predict New Tokens button or F1 to get new continuations (what you see when you right click) given your context.", bullet = True)
        dpg.add_text(default_value="After publication, I intend to open source this. In the next release, I will add support for BERT/Masked Language Models. I've already tested and know they work using this technique in principle.")
        dpg.add_text(default_value = "This utility is written using the DearPyGUI GUI library, and has the tiling mode enabled. You can move around the windows and tile them with each other to your hearts desire. I think a tool like this is a natural fit for a tiling window manager style layout")
        dpg.add_text(default_value = "Hovering over a green question-mark will pop-up a tooltip to give you context/help")
        dpg.add_text(default_value = "This window can be closed with the X in the top right")


# Global keyboard shortcuts, initial model load, and the DearPyGui main loop.
with dpg.handler_registry():
    # Use DearPyGui's named key constants rather than raw integers (113/112):
    # the numeric key codes are not guaranteed to be the same on every
    # platform or DearPyGui version, while the mvKey_* names are.
    dpg.add_key_press_handler(key=dpg.mvKey_F2, callback=tab_key_generate_tokens_callback) ##F2 inserts most likely token
    dpg.add_key_press_handler(key=dpg.mvKey_F1, callback=edit_string_callback) ##F1 generates new tokens

# Load the default model before the first prediction is requested.
load_model(the_name="EleutherAI/pythia-1b")

# Populate the continuation list once for the initial text box contents.
edit_string_callback()
dpg.set_global_font_scale(1.0)
#dpg.toggle_viewport_fullscreen()
dpg.show_viewport()
#dpg.set_primary_window("main_window", True)
# Blocks until the viewport is closed; the context is destroyed afterwards.
dpg.start_dearpygui()
dpg.destroy_context()