From c61e012d21fce50e0b3269417ee33e555a16cdaa Mon Sep 17 00:00:00 2001
From: KT313 <73772644+KT313@users.noreply.github.com>
Date: Tue, 22 Oct 2024 16:39:15 +0200
Subject: [PATCH 1/2] minor changes with pyflakes and pycodestyle
---
extensions/perplexity_colors/script.py | 97 ++++++++++++++------------
1 file changed, 54 insertions(+), 43 deletions(-)
diff --git a/extensions/perplexity_colors/script.py b/extensions/perplexity_colors/script.py
index 2a986ac40b..c5fa724ac3 100644
--- a/extensions/perplexity_colors/script.py
+++ b/extensions/perplexity_colors/script.py
@@ -1,11 +1,10 @@
-import time
-
import gradio
import numpy as np
import torch
from transformers import LogitsProcessor
+import colorsys
-from modules import html_generator, shared
+from modules import shared
params = {
'active': True,
@@ -81,6 +80,7 @@ def __call__(self, input_ids, scores):
# Stores the perplexity and top probabilities
+# global ppl_logits_processor
ppl_logits_processor = None
@@ -109,64 +109,74 @@ def output_modifier(text):
gen_tokens = [shared.tokenizer.decode(token_id) for token_id in gen_token_ids]
sel_probs = ppl_logits_processor.selected_probs[1:]
- end_part = '' if params['probability_dropdown'] else '' # Helps with finding the index after replacing part of the text.
+ formatted_text = ""
- i = 0
for token, prob, ppl, top_tokens, top_probs in zip(gen_tokens, sel_probs, perplexities, top_tokens_list, top_probs_list):
color = 'ffffff'
- if params['color_by_probability'] and params['color_by_perplexity']:
- color = probability_perplexity_color_scale(prob, ppl)
- elif params['color_by_perplexity']:
+ # if params['color_by_probability'] and params['color_by_perplexity']:
+ # color = probability_perplexity_color_scale(prob, ppl)
+ if params['color_by_perplexity']:
color = perplexity_color_scale(ppl)
elif params['color_by_probability']:
color = probability_color_scale(prob)
- if token in text[i:]:
- if params['probability_dropdown']:
- text = text[:i] + text[i:].replace(token, add_dropdown_html(token, color, top_tokens, top_probs[0], ppl), 1)
- else:
- text = text[:i] + text[i:].replace(token, add_color_html(token, color), 1)
- i += text[i:].find(end_part) + len(end_part)
+
+ if params['probability_dropdown']:
+ formatted_token = add_dropdown_html(token, color, top_tokens, top_probs[0], ppl)
+ else:
+ formatted_token = add_color_html(token, color)
+
+ formatted_text += formatted_token
+
+ # wonky fix to prevent the later html processing from making the first token into a separate paragraph and disabling its dropdown.
+ # this adds a dummy entry which gets made into an empty
paragraph instead of the first token
+ if params['probability_dropdown']:
+ formatted_text = '' + formatted_text
# Use full perplexity list for calculating the average here.
print('Average perplexity:', round(np.mean(ppl_logits_processor.perplexities_list[:-1]), 4))
# t1 = time.time()
# print(f"Modifier: {(t1-t0):.3f} s")
# About 50 ms
- return text
+ return formatted_text
def probability_color_scale(prob):
'''
Green-yellow-red color scale
'''
+ # hue (0.0 = red, 0.33 = green)
+ # saturation (0.0 = gray / white, 1.0 = normal, just leave at 1.0)
+ # brightness (0.0 = black, 1.0 = brightest, use 0.5 instead of 1.0 for better readability)
- rv = 0
- gv = 0
- if prob <= 0.5:
- rv = 'ff'
- gv = hex(int(255 * prob * 2))[2:]
- if len(gv) < 2:
- gv = '0' * (2 - len(gv)) + gv
- else:
- rv = hex(int(255 - 255 * (prob - 0.5) * 2))[2:]
- gv = 'ff'
- if len(rv) < 2:
- rv = '0' * (2 - len(rv)) + rv
+ hue = prob * 0.33
+ rv, gv, bv = colorsys.hsv_to_rgb(hue, 1.0, 0.7)
- return rv + gv + '00'
+ # to hex
+ hex_col = f"{int(rv*255):02x}{int(gv*255):02x}{int(bv*255):02x}"
+
+ return hex_col
def perplexity_color_scale(ppl):
'''
Red component only, white for 0 perplexity (sorry if you're not in dark mode)
'''
- value = hex(max(int(255.0 - params['ppl_scale'] * (float(ppl) - 1.0)), 0))[2:]
- if len(value) < 2:
- value = '0' * (2 - len(value)) + value
+ # hue (0.0 = red)
+ # saturation (1.0 = red)
+ # brightness (0.0 = black, 1.0 = red)
+ # scale saturation from white to red the higher the perplexity
+
+ ppl = min(ppl, params['ppl_scale']) # clip ppl to 0-params['ppl_scale'] for color scaling. 15 should be fine for clipping and scaling
+ sat = ppl / params['ppl_scale']
+ rv, gv, bv = colorsys.hsv_to_rgb(0.0, sat, 1.0)
+
+ # to hex
+ hex_col = f"{int(rv*255):02x}{int(gv*255):02x}{int(bv*255):02x}"
- return 'ff' + value + value
+ return hex_col
+# are you sure this is needed? Since perplexity is proportional to probability, it would make more sense to just pick one of the two
def probability_perplexity_color_scale(prob, ppl):
'''
Green-yellow-red for probability and blue component for perplexity
@@ -193,7 +203,7 @@ def probability_perplexity_color_scale(prob, ppl):
def add_color_html(token, color):
- return f'{token}'
+ return f'{token}'
# TODO: Major issue: Applying this to too many tokens will cause a permanent slowdown in generation speed until the messages are removed from the history.
@@ -201,7 +211,15 @@ def add_color_html(token, color):
# Potential solution is maybe to modify the main generation code to send just the internal text and not the visible history, to avoid moving too much around.
# I wonder if we can also avoid using deepcopy here.
def add_dropdown_html(token, color, top_tokens, top_probs, perplexity=0):
- html = f'{token}'
+
+ # for now replace all "\n" with "
" (ascii code for newline) since the postprocessing later messes up the formatting.
+ # Doesn't get displayed properly but at least doesn't mess up the formatting.
+ # If there are any newlines "\n", for some reason everything after the first newline will be made into a separate paragraph.
+ token = token.replace("\n", "
")
+
+ # replace spaces in token with non-linebreaking space character for html
+ token = token.replace(" ", " ")
+ html = f'{token}'
for token_option, prob in zip(top_tokens, top_probs):
# TODO: Bold for selected token?
# Using divs prevented the problem of divs inside spans causing issues.
@@ -213,7 +231,7 @@ def add_dropdown_html(token, color, top_tokens, top_probs, perplexity=0):
if perplexity != 0:
ppl_color = perplexity_color_scale(perplexity)
html += f'Perplexity: | {perplexity:.4f} |
'
- html += '
'
+ html += '
'
return html # About 750 characters per token...
@@ -263,13 +281,6 @@ def custom_css():
pre {
white-space: pre-wrap;
}
-
- # TODO: This makes the hover menus extend outside the bounds of the chat area, which is good.
- # However, it also makes the scrollbar disappear, which is bad.
- # The scroll bar needs to still be present. So for now, we can't see dropdowns that extend past the edge of the chat area.
- #.chat {
- # overflow-y: auto;
- #}
"""
@@ -282,7 +293,7 @@ def convert_to_markdown(string):
return '
' + string + '
'
-html_generator.convert_to_markdown = convert_to_markdown
+# html_generator.convert_to_markdown = convert_to_markdown
def ui():
From fcd72afe5616301d8657fd5e75ed74f2f7419606 Mon Sep 17 00:00:00 2001
From: KT313 <73772644+KT313@users.noreply.github.com>
Date: Wed, 23 Oct 2024 08:02:30 +0200
Subject: [PATCH 2/2] addition to skip output modifier if ppl_logits_processor
== None so new chat can be created when no model loaded
---
extensions/perplexity_colors/script.py | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/extensions/perplexity_colors/script.py b/extensions/perplexity_colors/script.py
index c5fa724ac3..7211901b5e 100644
--- a/extensions/perplexity_colors/script.py
+++ b/extensions/perplexity_colors/script.py
@@ -95,7 +95,7 @@ def output_modifier(text):
global ppl_logits_processor
# t0 = time.time()
- if not params['active']:
+ if not params['active'] or ppl_logits_processor == None:
return text
# TODO: It's probably more efficient to do this above rather than modifying all these lists