Spaces:

LLM360
/

TxT360

Running

hunterhector committed on Oct 7

Commit

9cbd894

•

1 Parent(s): 4cc0103

work on some section stuff

Files changed (4) hide show

common.py CHANGED Viewed

@@ -464,7 +464,6 @@ global_div = Div(
             style="display: flex; justify-content: center; align-items: center; width: 100%; max-width: 100%; height: auto; overflow-x: auto;"
         )
     ),
-    Section(H3("Conclusion"), P("NEED TO UPDATE")),
 )

             style="display: flex; justify-content: center; align-items: center; width: 100%; max-width: 100%; height: auto; overflow-x: auto;"
         )
     ),
 )

curated.py CHANGED Viewed

@@ -1722,11 +1722,12 @@ def curated():
     return Div(
         Section(
             overview,
         ),
         Section(
             curated_sources_intro,
             plotly2fasthtml(treemap_chart),
-            id="section31",
         ),
         Section(
             data_preprocessing_div,

     return Div(
         Section(
             overview,
+            id="section31",
         ),
         Section(
             curated_sources_intro,
             plotly2fasthtml(treemap_chart),
+            # id="section31",
         ),
         Section(
             data_preprocessing_div,

main.py CHANGED Viewed

@@ -874,6 +874,10 @@ def intro():
                 D_cite(bibtex_key="redpajama-v2"),
                 "we also hope to provide a dataset at this scale that is ready to go, without requiring futher filtering."
             ),
             id="section11",
         ),
         Section(

                 D_cite(bibtex_key="redpajama-v2"),
                 "we also hope to provide a dataset at this scale that is ready to go, without requiring futher filtering."
             ),
+            P(
+                B("How to Reaad this Blog Post?"),
+                P("This document contains all the details and is lengthy. We recommend readers to use the Table of Contents to jump to the appropriate sections. At each top level section, we provided a quick guide for the content. We also recommend readers to consider this post as a reference for some high level statistics related to pre-training datasets.")
+            ),
             id="section11",
         ),
         Section(

results.py CHANGED Viewed

@@ -764,7 +764,7 @@ intro_div = Div(
         Li("The Learning Curve of TxT360 with an Upsampling Recipe", style = "margin-bottom: 5px"),
         Li("Perplexity Analysis across time", style = "margin-bottom: 5px"),
         Li("Topic Analysis on Data Cluster Groups", style = "margin-bottom: 5px"),
-        Li(B("Estimated Reading Time: 15 minutes"), style = "margin-bottom: 5px"),
     ),
 )

         Li("The Learning Curve of TxT360 with an Upsampling Recipe", style = "margin-bottom: 5px"),
         Li("Perplexity Analysis across time", style = "margin-bottom: 5px"),
         Li("Topic Analysis on Data Cluster Groups", style = "margin-bottom: 5px"),
+        Li(B("Estimated Reading Time: 25 minutes"), style = "margin-bottom: 5px"),
     ),
 )