srijaydeshpande committed
Commit • aa98be2
1 Parent(s): b26fc16
Update app.py
app.py CHANGED
@@ -82,9 +82,9 @@ def txt_to_html(text):
 
 @spaces.GPU(duration=120)
 def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
-    prompt = "In the following text replace any person name and any address with term [redacted], replace any Date of Birth and NHS number with term [redacted]"
-
-
+    # prompt = "In the following text replace any person name and any address with term [redacted], replace any Date of Birth and NHS number with term [redacted]"
+    prompt = "Anonymize the following report"
+
     # model_id = "models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf"
     # # model = Llama(model_path=model_id, n_ctx=2048, n_threads=8, n_gpu_layers=-1, n_batch=128)
     # model = Llama(
@@ -96,20 +96,16 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
     # )
 
     chat_template = MessagesFormatterType.LLAMA_3
-
-    print('Control 1-----------------------------------')
 
     llm = Llama(
         model_path="models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
         flash_attn=True,
-        n_gpu_layers
+        n_gpu_layers=-1,
         n_batch=1024,
         n_ctx=8192,
     )
-    print('Control 2-----------------------------------')
 
     provider = LlamaCppPythonProvider(llm)
-    print('Control 3-----------------------------------')
 
     agent = LlamaCppAgent(
         provider,
@@ -117,7 +113,6 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
         predefined_messages_formatter_type=chat_template,
         debug_output=True
     )
-    print('Control 4-----------------------------------')
 
     settings = provider.get_provider_default_settings()
     settings.temperature = 0.7
@@ -130,14 +125,13 @@ def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
     messages = BasicChatHistory()
 
     stream = agent.get_chat_response(
-        prompt,
+        prompt + ' : ' + pdftext,
         llm_sampling_settings=settings,
         chat_history=messages,
         returns_streaming_generator=True,
         print_output=False
     )
-
-    print(stream)
+
     outputs = ""
     for output in stream:
         outputs += output
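
For readers skimming the hunks, here is a minimal sketch of the deidentify_doc flow as it stands after this commit. The imports, the elided LlamaCppAgent constructor arguments, the remaining sampling settings, and the trailing return are assumptions based on typical llama-cpp-python / llama-cpp-agent usage; only the lines shown in the diff above are confirmed by the commit.

# Sketch of the post-commit de-identification flow (not a verbatim copy of app.py).
# NOTE: imports and the "..." placeholders are assumptions; the diff does not show them.
import spaces
from llama_cpp import Llama
from llama_cpp_agent import LlamaCppAgent, MessagesFormatterType
from llama_cpp_agent.providers import LlamaCppPythonProvider
from llama_cpp_agent.chat_history import BasicChatHistory

@spaces.GPU(duration=120)
def deidentify_doc(pdftext, maxtokens, temperature, top_probability):
    # Simplified instruction introduced by this commit.
    prompt = "Anonymize the following report"

    # Quantized Llama 3 70B; n_gpu_layers=-1 offloads all layers to the GPU.
    llm = Llama(
        model_path="models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
        flash_attn=True,
        n_gpu_layers=-1,
        n_batch=1024,
        n_ctx=8192,
    )

    provider = LlamaCppPythonProvider(llm)
    agent = LlamaCppAgent(
        provider,
        # ... other constructor arguments not shown in this diff ...
        predefined_messages_formatter_type=MessagesFormatterType.LLAMA_3,
        debug_output=True,
    )

    settings = provider.get_provider_default_settings()
    settings.temperature = 0.7
    # ... remaining sampling settings not shown in this diff ...

    messages = BasicChatHistory()
    # The report text is appended to the instruction and streamed through the agent.
    stream = agent.get_chat_response(
        prompt + ' : ' + pdftext,
        llm_sampling_settings=settings,
        chat_history=messages,
        returns_streaming_generator=True,
        print_output=False,
    )

    # Accumulate the streamed chunks into the de-identified text.
    outputs = ""
    for output in stream:
        outputs += output
    return outputs  # assumed; the diff ends before the function's return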