LIFineTuned

Paused

App Files Files Community

alexkueck committed on Jun 28, 2023

Commit

9e85ff2

1 Parent(s): 3054dce

Update utils.py

Browse files

Files changed (1) hide show

utils.py +58 -0

utils.py CHANGED Viewed

@@ -150,6 +150,64 @@ def greedy_search(input_ids: torch.Tensor,
                 gc.collect()
                 return
 def convert_to_markdown(text):
     text = text.replace("$","&#36;")
     def replace_leading_tabs_and_spaces(line):

                 gc.collect()
                 return
+########################################
+#Predict
+def predict(text,
+            history,
+            top_p,
+            temperature,
+            max_length_tokens,
+            max_context_length_tokens,):
+    if text=="":
+        yield history,"Empty context."
+        return
+    try:
+        model
+    except:
+        yield [[text,"No Model Found"]],[],"No Model Found"
+        return
+    inputs = generate_prompt_with_history(text,history,tokenizer,max_length=max_context_length_tokens)
+    if inputs is None:
+        yield history,"Input too long."
+        return
+    else:
+        prompt,inputs=inputs
+        begin_length = len(prompt)
+    input_ids = inputs["input_ids"][:,-max_context_length_tokens:].to(device)
+    torch.cuda.empty_cache()
+    #torch.no_grad() bedeutet, dass für die betreffenden tensoren keine Ableitungen berechnet werden bei der backpropagation
+    #hier soll das NN ja auch nicht geändert werden 8backprop ist nicht nötig), da es um interference-prompts geht!
+    with torch.no_grad():
+        #die vergangenen prompts werden alle als Tupel in history abgelegt sortiert nach 'Human' und 'AI'- dass sind daher auch die stop-words, die den jeweils nächsten Eintrag kennzeichnen
+        for x in greedy_search(input_ids,model,tokenizer,stop_words=["[|Human|]", "[|AI|]"],max_length=max_length_tokens,temperature=temperature,top_p=top_p):
+            if is_stop_word_or_prefix(x,["[|Human|]", "[|AI|]"]) is False:
+                if "[|Human|]" in x:
+                    x = x[:x.index("[|Human|]")].strip()
+                if "[|AI|]" in x:
+                    x = x[:x.index("[|AI|]")].strip()
+                x = x.strip()
+                a, b=   [[y[0],convert_to_markdown(y[1])] for y in history]+[[text, convert_to_markdown(x)]],history + [[text,x]]
+                yield a, b, "Generating..."
+            if shared_state.interrupted:
+                shared_state.recover()
+                try:
+                    yield a, b, "Stop: Success"
+                    return
+                except:
+                    pass
+    del input_ids
+    gc.collect()
+    torch.cuda.empty_cache()
+    try:
+        yield a,b,"Generate: Success"
+    except:
+        pass
 def convert_to_markdown(text):
     text = text.replace("$","&#36;")
     def replace_leading_tabs_and_spaces(line):