victormiller committed on
Commit
2b149b6
1 Parent(s): a47c727

Update results.py

Browse files
Files changed (1) hide show
  1. results.py +60 -8
results.py CHANGED
@@ -416,9 +416,57 @@ fig.update_layout(
416
  # Show the figure
417
  llama_graph2 = fig
418
 
419
-
420
  #llama graph 3
421
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
422
  import plotly.graph_objects as go
423
 
424
  # Data for different years and dump duplications
@@ -481,10 +529,10 @@ fig.update_layout(
481
  )
482
 
483
  # Show the figure
484
- llama_graph3 = fig
485
 
486
 
487
- #llama graph 4
488
 
489
  # Data for different buckets and years
490
  import plotly.graph_objects as go
@@ -549,9 +597,9 @@ fig.update_layout(
549
  )
550
 
551
  # Show the figure
552
- llama_graph4 = fig
553
 
554
- ##llama graph 5
555
 
556
  # Data for different years and duplication counts
557
  data = {
@@ -613,7 +661,7 @@ fig.update_layout(
613
  )
614
 
615
  # Show the figure
616
- llama_graph5 = fig
617
 
618
 
619
  intro_div = Div(
@@ -684,16 +732,20 @@ llama_div = Div(
684
  H3("Perplexity vs Dump Duplication"),
685
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
686
  plotly2fasthtml(llama_graph3),
 
 
 
 
687
  ),
688
  Section(
689
  H3("Perplexity vs Local Buckets"),
690
  Img(src="images/prep-diff-buckets-local.png", height = "300", width = "600" ),
691
- plotly2fasthtml(llama_graph4),
692
  ),
693
  Section(
694
  H3("Perplexity vs Local Dump Duplication"),
695
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
696
- plotly2fasthtml(llama_graph5),
697
  ),
698
  )
699
 
 
416
  # Show the figure
417
  llama_graph2 = fig
418
 
 
419
  #llama graph 3
420
 
421
+ # Data for different buckets and perplexity values across years
422
+ data = {
423
+ "1-1": {
424
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
425
+ "perplexities": [10.036774097041135, 9.46310273785878, 9.41413706166537, 9.50318602661455, 9.007669062339426, 8.388255660116407, 10.112246017864624, 10.239269162661959, 9.931951075969451, 8.646614152066428]
426
+ },
427
+ "2-5": {
428
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
429
+ "perplexities": [9.306693996275795, 8.763464863196129, 8.645126825996691, 9.473904977192573, 10.95829859145081, 10.676105294328789, 10.255251179892559, 9.54987953569235, 9.12737570591033, 8.806922449908505]
430
+ },
431
+ "6-10": {
432
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
433
+ "perplexities": [9.442327622499175, 9.075851726027564, 9.527148465147846, 9.755998086072951, 10.128151243953157, 9.728353939624842, 9.233548505479437, 9.067380903629866, 8.995868137602248, 8.816629232137835]
434
+ },
435
+ "11-100": {
436
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
437
+ "perplexities": [9.015408185880002, 8.868392446242012, 9.120345162203675, 8.968012141869462, 9.451949410987668, 9.381837094065533, 9.25131862646364, 9.014261939731549, 9.00805668763514, 8.995152677487027]
438
+ },
439
+ "101-1000": {
440
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
441
+ "perplexities": [9.94583162297666, 9.113560631617027, 8.9228845723255, 8.895860780054043, 8.863879736723902, 8.401723232809463, 8.458532176757009, 8.14345667720481, 7.882044010499616, 7.737747701620713]
442
+ },
443
+ "1001-30000000": {
444
+ "years": ["2014", "2015", "2016", "2017", "2018", "2019", "2020", "2021", "2022", "2023"],
445
+ "perplexities": [9.141712571508352, 8.037411460181893, 9.14052983061081, 8.757970647106037, 8.440366034517687, 7.5705604983353325, 7.4808205167223525, 7.312019290288715, 7.538858258386088, 6.77703951001925]
446
+ }
447
+ }
448
+
449
+ # Create figure
450
+ fig = go.Figure()
451
+
452
+ # Add traces for each bucket
453
+ for bucket, bucket_data in data.items():
454
+ fig.add_trace(go.Scatter(x=bucket_data["years"], y=bucket_data["perplexities"], mode='lines+markers', name=bucket))
455
+
456
+ # Update layout
457
+ fig.update_layout(
458
+ title="Perplexity Across Different Buckets (Global)",
459
+ xaxis_title="Year",
460
+ yaxis_title="Average Perplexity",
461
+ legend_title="Bucket (Duplicate Count Range)"
462
+ )
463
+
464
+ # Keep the figure so it can be embedded via plotly2fasthtml
465
+ llama_graph3 = fig
466
+
467
+
468
+ #llama graph 4
469
+
470
  import plotly.graph_objects as go
471
 
472
  # Data for different years and dump duplications
 
529
  )
530
 
531
  # Show the figure
532
+ llama_graph4 = fig
533
 
534
 
535
+ #llama graph 5
536
 
537
  # Data for different buckets and years
538
  import plotly.graph_objects as go
 
597
  )
598
 
599
  # Show the figure
600
+ llama_graph5 = fig
601
 
602
+ #llama graph 6
603
 
604
  # Data for different years and duplication counts
605
  data = {
 
661
  )
662
 
663
  # Show the figure
664
+ llama_graph6 = fig
665
 
666
 
667
  intro_div = Div(
 
732
  H3("Perplexity vs Dump Duplication"),
733
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
734
  plotly2fasthtml(llama_graph3),
735
+ Section(
736
+ H3("Perplexity vs Dump Duplication"),
737
+ Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
738
+ plotly2fasthtml(llama_graph4),
739
  ),
740
  Section(
741
  H3("Perplexity vs Local Buckets"),
742
  Img(src="images/prep-diff-buckets-local.png", height = "300", width = "600" ),
743
+ plotly2fasthtml(llama_graph5),
744
  ),
745
  Section(
746
  H3("Perplexity vs Local Dump Duplication"),
747
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
748
+ plotly2fasthtml(llama_graph6),
749
  ),
750
  )
751