TxT360

Sleeping

victormiller committed on Sep 26

Commit

4028499

•

1 Parent(s): 9f87a47

Update curated.py

Files changed (1) hide show

curated.py CHANGED Viewed

@@ -7,6 +7,7 @@ import json
 from data_viewer import view_data, gen_random_id
 from rich import print
 import uuid
 overview_text = P("Curated sources comprise high-quality datasets that contain domain-specificity. These sources, such as Arxiv, Wikipedia, and Stack Exchange, provide valuable data that is excluded from the web dataset mentioned above. Analyzing and processing non-web data can yield insights and opportunities for various applications. Details about each of the sources are provided below. ")
 copyright_disclaimer = P("We respect the copyright of the data sources and have not included the controversial data that was used in Pile like YouTube and Opensubtitles, Reddit threads, and books.")

 from data_viewer import view_data, gen_random_id
 from rich import print
 import uuid
+import plotly.express as px
 overview_text = P("Curated sources comprise high-quality datasets that contain domain-specificity. These sources, such as Arxiv, Wikipedia, and Stack Exchange, provide valuable data that is excluded from the web dataset mentioned above. Analyzing and processing non-web data can yield insights and opportunities for various applications. Details about each of the sources are provided below. ")
 copyright_disclaimer = P("We respect the copyright of the data sources and have not included the controversial data that was used in Pile like YouTube and Opensubtitles, Reddit threads, and books.")