victormiller committed on
Commit
d875a86
1 Parent(s): aee89d3

Update results.py

Browse files
Files changed (1) hide show
  1. results.py +46 -17
results.py CHANGED
@@ -9,30 +9,59 @@ import plotly.express as px
9
 
10
  ##upsampling validation loss graph
11
 
 
12
 
13
- # Load the CSV file
14
- data = pd.read_csv('data/validation_loss _txt360_vs_fineweb.csv')
15
-
16
- # Create a plotly line chart
17
- fig = go.Figure()
18
-
19
- # Add the line for FineWeb-1.5T
20
- fig.add_trace(go.Scatter(x=data['Step'], y=data['FineWeb-1.5T'], mode='lines', name='FineWeb-1.5T'))
21
-
22
- # Add the line for TxT360
23
- fig.add_trace(go.Scatter(x=data['Step'], y=data['TxT360'], mode='lines', name='TxT360'))
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
 
25
  # Update layout
26
- fig.update_layout(
27
- title='Validation Loss Comparison: TxT360 vs FineWeb-1.5T',
28
  xaxis_title='Steps',
29
- yaxis_title='Validation Loss',
30
- legend_title='Dataset',
31
- template='plotly_white'
32
  )
33
 
 
 
34
  # Show the plot
35
- validation_loss_graph = fig
36
 
37
 
38
 
 
9
 
10
  ##upsampling validation loss graph
11
 
12
+ import plotly.graph_objects as go
13
 
14
+ # Data
15
+ steps = [5000, 10000, 15000, 20000, 25000, 30000, 35000, 40000, 45000, 50000,
16
+ 55000, 60000, 65000, 70000, 75000, 80000, 85000, 90000, 95000, 100000,
17
+ 105000, 110000, 115000, 120000, 125000, 130000, 135000, 140000, 145000,
18
+ 150000, 155000, 160000, 165000, 170000, 175000, 180000, 185000, 190000,
19
+ 195000, 200000, 205000, 210000, 215000, 220000, 225000, 230000, 235000,
20
+ 240000, 245000, 250000, 255000, 260000, 265000, 270000, 275000, 280000,
21
+ 285000]
22
+
23
+ fineweb = [2.911076784, 2.75819993, 2.647450924, 2.588769436, 2.565514088,
24
+ 2.527409077, 2.506954193, 2.493706465, 2.478432178, 2.476668596,
25
+ 2.467983723, 2.4843328, 2.439449787, 2.438807011, 2.426213741,
26
+ 2.459792614, 2.426000357, 2.403300762, 2.399668455, 2.404176235,
27
+ 2.39425993, 2.406329632, 2.381269455, 2.387765169, 2.373465776,
28
+ 2.374938488, 2.379047394, 2.370839834, 2.351930141, 2.35353899,
29
+ 2.356842279, 2.343327522, 2.335564375, 2.337301254, 2.322228193,
30
+ 2.323165655, 2.309478998, 2.326301336, 2.314562321, 2.280953169,
31
+ 2.291109324, 2.298957586, 2.282609463, 2.296112061, 2.286119938,
32
+ 2.279724598, 2.268625498, 2.27303195, 2.254729986, 2.260175228,
33
+ 2.248331785, 2.235989809, 2.241044521, 2.242579222, 2.216429472,
34
+ 2.250077009, 2.224117756]
35
+
36
+ txt360 = [2.589649677, 2.438303471, 2.383416414, 2.337049007, 2.300292492,
37
+ 2.29057312, 2.285922527, 2.265408278, 2.245058537, 2.24157238,
38
+ 2.23307991, 2.232925415, 2.226780653, 2.222440243, 2.194804668,
39
+ 2.210517406, 2.186522722, 2.185292006, 2.184529305, 2.185826778,
40
+ 2.171881914, 2.182652235, 2.169103146, 2.162784815, 2.165525436,
41
+ 2.159037828, 2.164080143, 2.143726826, 2.144924164, 2.138051987,
42
+ 2.138092995, 2.120969057, None, None, None, None, None, None, None,
43
+ None, None, None, None, None, None, None, None, None, None, None,
44
+ None, None, None, None, None, None, None, None, None, None]
45
+
46
+ # Plot
47
+ fig_val = go.Figure()
48
+
49
+ # Add lines
50
+ fig_val.add_trace(go.Scatter(x=steps, y=fineweb, mode='lines', name='FineWeb-1.5T'))
51
+ fig_val.add_trace(go.Scatter(x=steps, y=txt360, mode='lines', name='TxT360'))
52
 
53
  # Update layout
54
+ fig_val.update_layout(
55
+ title='Perplexity Across Steps',
56
  xaxis_title='Steps',
57
+ yaxis_title='Perplexity',
58
+ legend_title='Models'
 
59
  )
60
 
61
+ # Show plot
62
+
63
  # Show the plot
64
+ validation_loss_graph = fig_val
65
 
66
 
67