Spaces:

Overthrow4232
/

SaT

Runtime error

App Files Community

Overthrow4232 committed on Aug 3

Commit

04ca745

•

1 Parent(s): 809eaa8

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -16

app.py CHANGED Viewed

@@ -1,4 +1,3 @@
-import spaces
 import gradio as gr
 from wtpsplit import SaT
 import json
@@ -7,22 +6,20 @@ import json
 sat = SaT("sat-12l-sm")
 sat.half().to("cuda")
-@spaces.GPU(duration=59)
-def segment_text(input_text, txt_file):
     results = {}
     if input_text:
         # Process single text input
         sentences = sat.split(input_text)
         results["input_text"] = {"segments": sentences}
-    elif txt_file is not None:
-        # Process txt file
-        with open(txt_file.name, 'r', encoding='utf-8') as file:
-            for i, line in enumerate(file, 1):
-                line = line.strip()
-                if line:  # Skip empty lines
-                    sentences = sat.split(line)
-                    results[f"document_{i}"] = {"segments": sentences}
     # Create a JSON object with the results
     json_output = json.dumps(results, indent=2)
@@ -34,15 +31,16 @@ iface = gr.Interface(
     fn=segment_text,
     inputs=[
         gr.Textbox(lines=5, label="Input Text (Optional)"),
-        gr.File(label="Upload TXT file (Optional) Row-separated", file_types=[".txt"])
     ],
     outputs=gr.JSON(label="Segmented Text (JSON)"),
     title="Text Segmentation with SaT",
-    description="This app uses the SaT (Segment any Text) model to split input text into sentences and return the result as JSON. You can input text directly or upload a TXT file containing multiple documents (one per line). All credits to the respective author(s). Github: https://github.com/segment-any-text/wtpsplit/tree/main",
     examples=[
-        ["This is a test This is another test.", None],
-        ["Hello this is a test But this is different now Now the next one starts looool", None],
-        ["The quick brown fox jumps over the lazy dog It was the best of times, it was the worst of times", None],
     ]
 )

 import gradio as gr
 from wtpsplit import SaT
 import json
 sat = SaT("sat-12l-sm")
 sat.half().to("cuda")
+def segment_text(input_text, multi_doc_input):
     results = {}
     if input_text:
         # Process single text input
         sentences = sat.split(input_text)
         results["input_text"] = {"segments": sentences}
+    if multi_doc_input:
+        # Process multiple documents
+        documents = [doc.strip() for doc in multi_doc_input.split('\n') if doc.strip()]
+        for i, doc in enumerate(documents, 1):
+            sentences = sat.split(doc)
+            results[f"row_{i}"] = {"segments": sentences}
     # Create a JSON object with the results
     json_output = json.dumps(results, indent=2)
     fn=segment_text,
     inputs=[
         gr.Textbox(lines=5, label="Input Text (Optional)"),
+        gr.Textbox(lines=10, label="Multiple Documents (Optional, one per line)")
     ],
     outputs=gr.JSON(label="Segmented Text (JSON)"),
     title="Text Segmentation with SaT",
+    description="This app uses the SaT (Segment any Text) model to split input text into sentences and return the result as JSON. You can input text directly or provide multiple documents (one per line). All credits to the respective author(s). Github: https://github.com/segment-any-text/wtpsplit/tree/main",
     examples=[
+        ["This is a test This is another test.", ""],
+        ["Hello this is a test But this is different now Now the next one starts looool", ""],
+        ["The quick brown fox jumps over the lazy dog It was the best of times, it was the worst of times", ""],
+        ["", "Document 1 first sentence Document 1 second sentence\nDocument 2 only sentence\nDocument 3 first Document 3 second"]
     ]
 )