victormiller committed on
Commit
01126c7
1 Parent(s): 12aa2bb

Update results.py

Browse files
Files changed (1) hide show
  1. results.py +67 -2
results.py CHANGED
@@ -418,7 +418,72 @@ llama_graph2 = fig
418
 
419
 
420
  #llama graph 3
421
- #tbd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
422
  #llama graph 4
423
 
424
  # Data for different buckets and years
@@ -618,7 +683,7 @@ llama_div = Div(
618
  Section(
619
  H3("Perplexity vs Dump Duplication"),
620
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
621
- #plotly2fasthtml(llama_graph3),
622
  ),
623
  Section(
624
  H3("Perplexity vs Local Buckets"),
 
418
 
419
 
420
  #llama graph 3
421
+
422
+ import plotly.graph_objects as go
423
+
424
+ # Data for different years and dump duplications
425
+ data = {
426
+ "2014": {
427
+ "dumps": [1, 2, 3, 4, 5, 6, 7],
428
+ "perplexities": [9.73915022954687, 8.917501442736835, 10.870824235415164, 8.839485979263355, 9.114611185408386, 9.00595271327483, 9.069847072965578]
429
+ },
430
+ "2015": {
431
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14],
432
+ "perplexities": [9.219127989173247, 8.610711104284512, 8.505043568675715, 7.990039784261444, 8.107957918641446, 8.796945238229792, 8.013223752027935, 8.890635712836795, 8.83059261426682, 10.04094169141142, 8.570752850736193, 9.003542320883396, 8.587190578806105, 7.983045509484727]
433
+ },
434
+ "2016": {
435
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23],
436
+ "perplexities": [9.224890447512712, 8.982140506828461, 7.624091188629551, 8.97063321078077, 8.261724045845817, 7.793111396647548, 7.829316622145423, 8.597365842164928, 9.301981760525631, 9.66361415155858, 9.258511719598742, 9.441774097297651, 9.429412341325685, 9.325699904738741, 8.836147021549138, 8.607104273128627, 8.722839588316196, 8.920039351586981, 8.914454312645233, 8.899123060759182, 9.793833500279591, 10.134616145581552, 8.353063455545444]
437
+ },
438
+ "2017": {
439
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34],
440
+ "perplexities": [9.488743166894329, 9.683975569858143, 8.654505727247006, 8.066421362212841, 8.395709115228499, 8.500311197527102, 9.10900254771213, 7.794618707693523, 8.059130491102199, 7.840987528913394, 8.94443662009675, 8.811736884161157, 9.395950762255111, 8.88696403862443, 9.064476456994532, 9.474527237081157, 8.91858984698398, 9.008242064314263, 8.840440114974651, 7.978242830053041, 8.653702083122754, 9.395390940155544, 8.644847872201382, 9.017641716864084, 8.731668787167907, 7.294766100138992, 9.116288498873331, 8.812157001137116, 8.229244256822179, 10.705494840702238, 8.4287361645181, 9.127134117671186, 8.418280990577143, 8.223315656547781]
441
+ },
442
+ "2018": {
443
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46],
444
+ "perplexities": [9.896529727642656, 9.375668627700882, 9.53229676611742, 9.709666311696747, 9.371857870215996, 9.756320954898577, 9.3489352873219, 9.41874088848098, 9.220103832539115, 9.493717136086154, 9.894783254332049, 10.271325431375882, 9.444295310961042, 9.259722713114918, 9.121852071096205, 10.266770364074752, 9.322189177071575, 9.200133535506806, 9.391739906453976, 9.166754675924274, 9.386922783373333, 9.269174320074539, 8.921691129048623, 8.500872698966008, 8.427801104408742, 8.957096089538366, 8.843138224464884, 8.839757712227849, 8.730159045861498, 8.761283943113895, 8.955585790830773, 9.480108588809301, 8.975279317370992, 8.647350666497408, 8.040519395112794, 8.154306078995903, 9.047836211768528, 8.388013770335506, 9.27023552172876, 8.392778372966038, 9.698769530780428, 8.48774562040954, 9.832837942793894, 8.801856106666897, 9.090280166741453, 8.066384841477534]
445
+ },
446
+ "2019": {
447
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58],
448
+ "perplexities": [9.32068228893817, 11.36279410700072, 9.729296413744873, 10.951540717951199, 9.571599362297537, 8.746033912439227, 8.911359607667526, 8.652716464937903, 8.90908579802875, 9.526405246155608, 8.84494033246573, 9.45556467668226, 9.61666194147301, 9.471820461436957, 9.385272422926384, 9.300484355205835, 9.374562863672638, 8.921445075261644, 8.457279643164815, 8.911117277418406, 8.076917631172464, 8.58392948648068, 9.138574660565174, 9.03583800697058, 8.706482138788626, 8.581302039813796, 8.567006611519137, 5.454819541045107, 8.380493341695487, 8.129823277176698, 7.346580306828866, 8.182982036096053, 8.03219664626822, 8.434163783307083, 8.148075720769123, 8.20825575224898, 7.7034049100948945, 8.319494286475098, 8.449794025203127, 8.40448676995273, 8.394065958286836, 8.431905407945235, 8.684778696918817, 10.170628597487527, 7.685742913353763, 8.317540224765809, 7.100457493121143, 5.389889122637774, 6.52302432138372, 8.895820543553361, 8.540964121500908, 5.823656104193133, 8.946389481295038, 8.03972593805594, 7.406476375508138, 7.434287132433397, 8.592981328562821, 9.803727252301018],
449
+ },
450
+ "2020": {
451
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67],
452
+ "perplexities": [10.012609650486192, 7.943056443498068, 8.44096110442561, 9.029669769296477, 8.409724985539306, 8.731282990251563, 8.434833756562051, 8.497304934371442, 8.467244156051745, 8.606236488210545, 8.805728093624284, 9.375705002747582, 9.21767027458378, 9.048307919892986, 9.77562185114431, 8.730686261181575, 9.434356327584526, 9.119611839878791, 9.17722037907838, 8.569631235903184, 8.899794145233415, 9.315415673275877, 8.170599811786479, 8.538223762760031, 8.19667246899941, 8.740262061758479, 8.335448351341697, 8.321473204597588, 8.505543388481339, 8.552966240767482, 8.350236112276809, 8.109081033072668, 8.539929546398097, 8.535623890267809, 8.152345891530405, 8.399872141360548, 7.737922667873269, 8.15695720088359, 8.175043636189214, 7.595645045643389, 7.911222051300795, 8.645606075472527, 8.114112476153545, 8.054768997187903, 7.800103557084926, 8.096027154350947, 8.10653262234877, 8.029447458295808, 7.192697926255588, 9.370330492895473, 8.523467886567657, 7.313215625083473, 8.839958839301076, 8.656716147817143, 8.137974531785895, 8.523363904379156, 6.108894835851177, 7.818953624010673, 8.49431208395812, 8.342596121020756, 7.742470144320784, 6.682052985671971, 6.759804959168626, 9.093551460193316, 7.062030527371495, 8.434506543833649, 6.781692983120098],
453
+ },
454
+ "2021": {
455
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76],
456
+ "perplexities": [9.841089195168713, 8.366233239891208, 8.059521351436208, 8.318918468325863, 8.324706089968892, 8.32605366049384, 8.435930736985704, 8.66800508008913, 8.406990633173743, 8.962431358959584, 8.850717354466074, 9.1716199955458, 9.302688993535714, 8.939046098190769, 9.051679849424985, 8.682789687366284, 8.994991585405426, 8.561380912367396, 8.787500555168679, 8.843251281455629, 8.7217706466806, 8.381660448144187, 9.395216774912862, 8.591359926732526, 8.453429031525232, 8.456509570151965, 8.628116911794814, 8.53819222436614, 8.730438299562152, 9.376235492300244, 8.15154442462199, 8.54875158466325, 8.163866477674533, 8.304409143008455, 8.856929571720633, 8.167913697870857, 7.84492260274128, 8.162407286516313, 8.321838697740313, 8.253127215455834, 8.248563253933684, 8.499374467029739, 8.680742460396948, 7.967559876484448, 8.095069183089077, 7.912424470771882, 7.7624804836167565, 7.807769541801359, 8.016590141394108, 7.6555859978103316, 8.416070459989983, 7.512191560306614, 7.994576039964321, 7.185188422240499, 7.660311594811295, 7.23106290817905, 6.982644852723388, 7.843742555580493, 7.005057894403877, 8.430250121211994, 5.657881355879867, 6.726292542438366, 7.486937111190708, 7.712303495834796, 6.246962399681747, 6.92875404699629, 5.329766234792039, 5.709327997807491, 7.971206942045293, 5.686373279239376, 6.1781744792525615, 8.241084719551052, 8.439160967397711, 7.65310078654845, 6.327069191350794, 3.91910919080523],
457
+ },
458
+ "2022": {
459
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82],
460
+ "perplexities": [9.483592568856565, 7.189994228954454, 8.316909239194644, 7.86424678656687, 9.220674611582542, 8.321976529350732, 9.10888002884781, 8.225969911900018, 8.384237608546773, 8.780327271679809, 9.364145618644377, 9.495859713757827, 9.106949174218812, 9.23421176581141, 9.163921762844911, 8.794794461344875, 8.828930317074237, 8.910619607048394, 8.875861267417038, 8.806690212582172, 9.061056708418198, 8.866883414667015, 8.67286618308663, 8.682273027254936, 8.305102405030174, 8.189733511502775, 8.924337748216326, 8.659728319566609, 8.444422835653581, 8.755250021389994, 8.000000289145156, 8.081525926632303, 8.061721834769063, 7.895475427973516, 8.287032632326136, 8.472773038016852, 7.663326197885218, 7.847535650315383, 7.732755997953167, 7.960257016089297, 7.608447426559309, 7.598389147784626, 7.946761405541756, 7.773873549407202, 8.126908611820289, 7.916664649722816, 7.894622086606636, 7.680503580812927, 7.727898320658088, 7.432772901777352, 8.202398282489195, 8.042184753937285, 7.73548358717129, 7.682704039184239, 8.158164009607694, 7.345186708566949, 7.828163052277644, 7.611824744941703, 7.241808787698759, 7.582892852952833, 7.879397809151155, 7.134581497547041, 7.78667356422719, 6.656397614763345, 7.023352560594163, 7.362930730205023, 7.3699197483652386, 6.7454140379422265, 5.903262622771099, 6.434879224359672, 7.306608742238141, 7.9100884219615555, 7.924947631037447, 8.120669403708789, 7.8919156097528464, 7.295660656533646, 5.599201327007343, 5.260468504600074, 6.889443342018529, 5.396932289937023, 6.7357812331788285, 7.079240389198726],
461
+ },
462
+ "2023": {
463
+ "dumps": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87],
464
+ "perplexities": [8.70489099557147, 7.743567081947979, 5.707700759513075, 7.42267071929539, 7.528257194741652, 6.766266255314377, 8.140487690026744, 7.968460364579144, 8.378534732391445, 8.462864835761868, 8.750163467122363, 9.030159982511133, 8.947498611252533, 9.26185161266797, 9.148155404351185, 9.160868347246595, 9.132536983584458, 9.12916497406581, 9.027825944368539, 9.127169658958355, 9.087762413460762, 9.288851446582335, 9.21606664952798, 9.10292838042461, 9.142519978568224, 8.822355646917647, 8.900446619619732, 8.79981304565808, 8.918708459617246, 9.13267243596762, 8.759214105765599, 8.961577284078654, 8.12181490449537, 8.43888231714366, 8.724831350613316, 8.258762532936931, 8.337583232620341, 8.223678511207945, 8.19914152935067, 8.250449659843008, 8.488274186714182, 8.063794656047826, 8.267469501822353, 8.109403400519883, 7.897519766033864, 8.029859903259943, 8.01415790723292, 7.852726835204203, 7.524006414246027, 8.016485804552786, 8.181980185953115, 7.7865858384362445, 7.630488133713028, 7.744179998387641, 7.9618609986528766, 7.818104340203628, 7.873732400580378, 7.643522973769515, 7.743819932052891, 7.603304862075835, 7.499516191588959, 7.919857492185231, 7.294200517555408, 7.835098137549298, 7.562994060655124, 7.426074658906729, 7.4503303575596185, 7.6402144041645315, 6.889172499203354, 7.869082402525025, 7.476479798274207, 7.46012411648056, 7.016878527752248, 7.233305845472016, 6.657949958745544, 6.2352925881040875, 6.558931554888652, 6.094819134587699, 6.444696396841287, 5.338755088514068, 5.367611973164904, 5.425863412036782, 4.20042362030674, 5.111941016244413, 5.149295160813693, 3.9082208202377435, 2.6866750639387136],
465
+ },
466
+ }
467
+
468
+ # Create figure
469
+ fig = go.Figure()
470
+
471
+ # Add traces for each year
472
+ for year, year_data in data.items():
473
+ fig.add_trace(go.Scatter(x=year_data["dumps"], y=year_data["perplexities"], mode='lines+markers', name=year))
474
+
475
+ # Update layout
476
+ fig.update_layout(
477
+ title="Perplexity Across Different Dump Duplication Counts (Global)",
478
+ xaxis_title="Number of Dumps Duplication",
479
+ yaxis_title="Average Perplexity",
480
+ legend_title="Year"
481
+ )
482
+
483
+ # Keep a handle to the figure so the page layout can embed it
484
+ llama_graph3 = fig
485
+
486
+
487
  #llama graph 4
488
 
489
  # Data for different buckets and years
 
683
  Section(
684
  H3("Perplexity vs Dump Duplication"),
685
  Img(src="images/prep-vs-dump-dup-global.png", height = "300", width = "600" ),
686
+ plotly2fasthtml(llama_graph3),
687
  ),
688
  Section(
689
  H3("Perplexity vs Local Buckets"),