Omost

Sleeping

App Files Community

layerdiffusion committed on May 30

Commit

a1c7119

•

1 Parent(s): a9cb4cf

i

Browse files

Files changed (2) hide show

app.py +16 -1
chat_interface.py +16 -10

app.py CHANGED Viewed

@@ -28,6 +28,7 @@ from diffusers.models.attention_processor import AttnProcessor2_0
 from transformers import CLIPTextModel, CLIPTokenizer
 from lib_omost.pipeline import StableDiffusionXLOmostPipeline
 from chat_interface import ChatInterface
 import lib_omost.canvas as omost_canvas
@@ -130,9 +131,23 @@ def chat_fn(message: str, history: list, seed:int, temperature: float, top_p: fl
     streamer = TextIteratorStreamer(llm_tokenizer, timeout=10.0, skip_prompt=True, skip_special_tokens=True)
     generate_kwargs = dict(
         input_ids=input_ids,
         streamer=streamer,
         max_new_tokens=max_new_tokens,
         do_sample=True,
         temperature=temperature,
@@ -148,7 +163,7 @@ def chat_fn(message: str, history: list, seed:int, temperature: float, top_p: fl
     for text in streamer:
         outputs.append(text)
         # print(outputs)
-        yield "".join(outputs)
     print(f'Chat end at {time.time() - time_stamp:.2f} seconds:', message)
     return

 from transformers import CLIPTextModel, CLIPTokenizer
 from lib_omost.pipeline import StableDiffusionXLOmostPipeline
 from chat_interface import ChatInterface
+from transformers.generation.stopping_criteria import StoppingCriteriaList
 import lib_omost.canvas as omost_canvas
     streamer = TextIteratorStreamer(llm_tokenizer, timeout=10.0, skip_prompt=True, skip_special_tokens=True)
+    def interactive_stopping_criteria(input_ids: torch.LongTensor, score: torch.FloatTensor, **kwargs) -> bool:
+        if getattr(streamer, 'user_interrupted', False):
+            print('User stopped generation')
+            return True
+        else:
+            return False
+    stopping_criteria = StoppingCriteriaList([interactive_stopping_criteria])
+    def interrupter():
+        streamer.user_interrupted = True
+        return
     generate_kwargs = dict(
         input_ids=input_ids,
         streamer=streamer,
+        stopping_criteria=stopping_criteria,
         max_new_tokens=max_new_tokens,
         do_sample=True,
         temperature=temperature,
     for text in streamer:
         outputs.append(text)
         # print(outputs)
+        yield "".join(outputs), interrupter
     print(f'Chat end at {time.time() - time_stamp:.2f} seconds:', message)
     return

chat_interface.py CHANGED Viewed

@@ -20,7 +20,7 @@ from gradio.components import (
     State,
     Textbox,
     get_component_instance,
-    Dataset
 )
 from gradio.events import Dependency, on
 from gradio.helpers import special_args
@@ -103,6 +103,8 @@ class ChatInterface(Blocks):
         self.pre_fn = pre_fn
         self.pre_fn_kwargs = pre_fn_kwargs
         self.multimodal = multimodal
         self.concurrency_limit = concurrency_limit
         self.fn = fn
@@ -287,7 +289,7 @@ class ChatInterface(Blocks):
             .then(
                 submit_fn,
                 [self.saved_input, self.chatbot_state] + self.additional_inputs,
-                [self.chatbot, self.chatbot_state],
                 show_api=False,
                 concurrency_limit=cast(
                     Union[int, Literal["default"], None], self.concurrency_limit
@@ -395,6 +397,11 @@ class ChatInterface(Blocks):
     def _setup_stop_events(
         self, event_triggers: list[Callable], event_to_cancel: Dependency
     ) -> None:
         if self.stop_btn and self.is_generator:
             if self.submit_btn:
                 for event_trigger in event_triggers:
@@ -434,9 +441,8 @@ class ChatInterface(Blocks):
                     queue=False,
                 )
             self.stop_btn.click(
-                None,
-                None,
-                None,
                 cancels=event_to_cancel,
                 show_api=False,
             )
@@ -545,7 +551,7 @@ class ChatInterface(Blocks):
             )
             generator = SyncToAsyncIterator(generator, self.limiter)
         try:
-            first_response = await async_iteration(generator)
             if self.multimodal and isinstance(message, dict):
                 for x in message["files"]:
                     history.append([(x,), None])
@@ -553,21 +559,21 @@ class ChatInterface(Blocks):
                 yield update, update
             else:
                 update = history + [[message, first_response]]
-                yield update, update
         except StopIteration:
             if self.multimodal and isinstance(message, dict):
                 self._append_multimodal_history(message, None, history)
                 yield history, history
             else:
                 update = history + [[message, None]]
-                yield update, update
-        async for response in generator:
             if self.multimodal and isinstance(message, dict):
                 update = history + [[message["text"], response]]
                 yield update, update
             else:
                 update = history + [[message, response]]
-                yield update, update
     async def _api_submit_fn(
         self, message: str, history: list[list[str | None]], request: Request, *args

     State,
     Textbox,
     get_component_instance,
+    Dataset,
 )
 from gradio.events import Dependency, on
 from gradio.helpers import special_args
         self.pre_fn = pre_fn
         self.pre_fn_kwargs = pre_fn_kwargs
+        self.interrupter = State(None)
         self.multimodal = multimodal
         self.concurrency_limit = concurrency_limit
         self.fn = fn
             .then(
                 submit_fn,
                 [self.saved_input, self.chatbot_state] + self.additional_inputs,
+                [self.chatbot, self.chatbot_state, self.interrupter],
                 show_api=False,
                 concurrency_limit=cast(
                     Union[int, Literal["default"], None], self.concurrency_limit
     def _setup_stop_events(
         self, event_triggers: list[Callable], event_to_cancel: Dependency
     ) -> None:
+        def perform_interrupt(ipc):
+            if ipc is not None:
+                ipc()
+            return
         if self.stop_btn and self.is_generator:
             if self.submit_btn:
                 for event_trigger in event_triggers:
                     queue=False,
                 )
             self.stop_btn.click(
+                fn=perform_interrupt,
+                inputs=[self.interrupter],
                 cancels=event_to_cancel,
                 show_api=False,
             )
             )
             generator = SyncToAsyncIterator(generator, self.limiter)
         try:
+            first_response, first_interrupter = await async_iteration(generator)
             if self.multimodal and isinstance(message, dict):
                 for x in message["files"]:
                     history.append([(x,), None])
                 yield update, update
             else:
                 update = history + [[message, first_response]]
+                yield update, update, first_interrupter
         except StopIteration:
             if self.multimodal and isinstance(message, dict):
                 self._append_multimodal_history(message, None, history)
                 yield history, history
             else:
                 update = history + [[message, None]]
+                yield update, update, first_interrupter
+        async for response, interrupter in generator:
             if self.multimodal and isinstance(message, dict):
                 update = history + [[message["text"], response]]
                 yield update, update
             else:
                 update = history + [[message, response]]
+                yield update, update, interrupter
     async def _api_submit_fn(
         self, message: str, history: list[list[str | None]], request: Request, *args