Spaces:

NeuML
/

txtai

Running

App Files Files Community

davidmezzetti committed on Nov 9, 2021

Commit

e43b653

•

1 Parent(s): 09a5aa4

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -15

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ import pandas as pd
 import streamlit as st
 from txtai.embeddings import Documents, Embeddings
-from txtai.pipeline import Segmentation, Summary, Tabular, Textractor, Transcription, Translation
 from txtai.workflow import ServiceTask, Task, UrlTask, Workflow
@@ -94,11 +94,8 @@ class Application:
             options["minlength"] = self.number("Min length")
             options["maxlength"] = self.number("Max length")
-        elif component in ("segment", "textract"):
-            if component == "segment":
-                st.sidebar.markdown("**Segment**  \n*Split text into semantic units*")
-            else:
-                st.sidebar.markdown("**Textractor**  \n*Extract text from documents*")
             options["sentences"] = st.sidebar.checkbox("Split sentences")
             options["lines"] = st.sidebar.checkbox("Split lines")
@@ -172,10 +169,6 @@ class Application:
                 self.pipelines[wtype] = Tabular(**self.components["tabular"])
                 tasks.append(Task(self.pipelines["tabular"]))
-            elif wtype == "textract":
-                self.pipelines[wtype] = Textractor(**self.components["textract"])
-                tasks.append(UrlTask(self.pipelines["textract"]))
             elif wtype == "transcribe":
                 self.pipelines[wtype] = Transcription(component.pop("path"))
                 tasks.append(UrlTask(self.pipelines["transcribe"], r".\.wav$"))
@@ -223,10 +216,6 @@ class Application:
                 data["tabular"] = component
                 tasks.append({"action": "tabular"})
-            elif wtype == "textract":
-                data["textractor"] = component
-                tasks.append({"action": "textractor", "task": "url"})
             elif wtype == "transcribe":
                 data["transcription"] = {"path": component.pop("path")}
                 tasks.append({"action": "transcription", "task": "url"})
@@ -341,7 +330,7 @@ class Application:
         st.sidebar.markdown("# Workflow builder  \n*Build and apply workflows to data*  ")
         # Get selected components
-        components = ["embeddings", "segment", "service", "summary", "tabular", "textract", "transcribe", "translate"]
         selected = st.sidebar.multiselect("Select components", components)
         # Get selected options

 import streamlit as st
 from txtai.embeddings import Documents, Embeddings
+from txtai.pipeline import Segmentation, Summary, Tabular, Transcription, Translation
 from txtai.workflow import ServiceTask, Task, UrlTask, Workflow
             options["minlength"] = self.number("Min length")
             options["maxlength"] = self.number("Max length")
+        elif component == "segment":
+            st.sidebar.markdown("**Segment**  \n*Split text into semantic units*")
             options["sentences"] = st.sidebar.checkbox("Split sentences")
             options["lines"] = st.sidebar.checkbox("Split lines")
                 self.pipelines[wtype] = Tabular(**self.components["tabular"])
                 tasks.append(Task(self.pipelines["tabular"]))
             elif wtype == "transcribe":
                 self.pipelines[wtype] = Transcription(component.pop("path"))
                 tasks.append(UrlTask(self.pipelines["transcribe"], r".\.wav$"))
                 data["tabular"] = component
                 tasks.append({"action": "tabular"})
             elif wtype == "transcribe":
                 data["transcription"] = {"path": component.pop("path")}
                 tasks.append({"action": "transcription", "task": "url"})
         st.sidebar.markdown("# Workflow builder  \n*Build and apply workflows to data*  ")
         # Get selected components
+        components = ["embeddings", "segment", "service", "summary", "tabular", "transcribe", "translate"]
         selected = st.sidebar.multiselect("Select components", components)
         # Get selected options