TxT360 / results.py
hunterhector's picture
work on some section stuff
9cbd894
from fasthtml.common import *
from fasthtml.components import *
from fasthtml.components import (
D_cite,
)
import os
import json
from fh_plotly import plotly2fasthtml
from plotly import graph_objects as go
import pandas as pd
import plotly.express as px
from eval_result_figures import all_eval_res_figs
## Upsampling validation-loss graph
# Steps at which validation loss was recorded: 5,000 through 285,000
# inclusive, one checkpoint every 5,000 steps (57 entries).
steps = list(range(5000, 285001, 5000))

# FineWeb validation loss, one value per entry in `steps`.
fineweb = [
    2.911076784, 2.75819993, 2.647450924, 2.588769436, 2.565514088,
    2.527409077, 2.506954193, 2.493706465, 2.478432178, 2.476668596,
    2.467983723, 2.4843328, 2.439449787, 2.438807011, 2.426213741,
    2.459792614, 2.426000357, 2.403300762, 2.399668455, 2.404176235,
    2.39425993, 2.406329632, 2.381269455, 2.387765169, 2.373465776,
    2.374938488, 2.379047394, 2.370839834, 2.351930141, 2.35353899,
    2.356842279, 2.343327522, 2.335564375, 2.337301254, 2.322228193,
    2.323165655, 2.309478998, 2.326301336, 2.314562321, 2.280953169,
    2.291109324, 2.298957586, 2.282609463, 2.296112061, 2.286119938,
    2.279724598, 2.268625498, 2.27303195, 2.254729986, 2.260175228,
    2.248331785, 2.235989809, 2.241044521, 2.242579222, 2.216429472,
    2.250077009, 2.224117756,
]

# TxT360 validation loss for the first 32 checkpoints (up to step 160,000);
# no values are available for the remaining steps.
txt360 = [
    2.589649677, 2.438303471, 2.383416414, 2.337049007, 2.300292492,
    2.29057312, 2.285922527, 2.265408278, 2.245058537, 2.24157238,
    2.23307991, 2.232925415, 2.226780653, 2.222440243, 2.194804668,
    2.210517406, 2.186522722, 2.185292006, 2.184529305, 2.185826778,
    2.171881914, 2.182652235, 2.169103146, 2.162784815, 2.165525436,
    2.159037828, 2.164080143, 2.143726826, 2.144924164, 2.138051987,
    2.138092995, 2.120969057,
]
# Pad the missing checkpoints with None so that y has exactly one entry per
# step. The padding used to be hand-written and had drifted to 60 entries
# against 57 steps; deriving it from len(steps) keeps the two in sync.
txt360 += [None] * (len(steps) - len(txt360))

# Build the figure: one line per dataset over the shared step axis.
fig_val = go.Figure()
fig_val.add_trace(go.Scatter(x=steps, y=fineweb, mode='lines', name='FineWeb'))
fig_val.add_trace(go.Scatter(x=steps, y=txt360, mode='lines', name='TxT360'))

# Titles for the figure, both axes and the legend.
fig_val.update_layout(
    title='Validation Loss Over Steps: TxT360 vs FineWeb',
    xaxis_title='Steps',
    yaxis_title='Loss',
    legend_title='Models'
)

# Export under the public name; the figure is not displayed here.
validation_loss_graph = fig_val
## LM loss graph
# Read the LM loss table. The columns used below are 'Step', 'TxT360'
# and 'FineWeb'; the path is relative to the working directory.
data = pd.read_csv('data/lm_loss_txt360_fineweb.csv')

# Pass both line traces to the constructor, TxT360 first so the trace
# order (and therefore legend order) matches the previous add_trace calls.
fig_loss = go.Figure(
    data=[
        go.Scatter(x=data['Step'], y=data['TxT360'], mode='lines', name='TxT360'),
        go.Scatter(x=data['Step'], y=data['FineWeb'], mode='lines', name='FineWeb'),
    ]
)

# Titles for the figure, both axes and the legend.
fig_loss.update_layout(
    title="LM Loss Over Steps: TxT360 vs FineWeb",
    xaxis_title="Steps",
    yaxis_title="Loss",
    legend_title="Models",
)

# Export under the public name; the figure is not displayed here.
lm_loss_graph = fig_loss
# Perplexity per bucket: each key is a bucket label and each list holds one
# value per entry in `years` (ten values, 2014 through 2023).
data = {
    "1-1": [
        17.410227605477868, 17.446573602753478, 17.307221780905284,
        17.338525603992114, 17.08551151136689, 16.818363305107052,
        16.98821894111693, 17.125795647512877, 16.573462144306383,
        15.4293630385597,
    ],
    "2-5": [
        16.11176217183986, 16.14852530113782, 16.297702171159543,
        15.960924352297502, 16.187802102106698, 16.474269837858706,
        15.936494557783181, 15.780419457145868, 15.283018703313582,
        14.608379914730168,
    ],
    "6-10": [
        15.632757662414805, 15.627408549576069, 15.948641884223639,
        15.912187993988933, 14.935072408852303, 14.944741674400241,
        14.79960386342691, 14.631430892394002, 14.378277745163881,
        14.118271697056592,
    ],
    "11-100": [
        15.446116676532212, 15.0055028132117, 14.799690714225637,
        14.822102470001267, 14.832038213200583, 14.568394784374943,
        14.435682562274105, 14.276477514399625, 14.0611924390084,
        13.880215644749589,
    ],
    "101-1000": [
        16.716943171826703, 15.565430373421485, 14.935989931859659,
        14.778913482337416, 14.508674264491997, 14.690158822673334,
        14.58651834886038, 14.337146941773641, 13.9886330091318,
        13.767106666731275,
    ],
    "1001-30000000": [
        18.156821563322765, 17.314701050452452, 16.09585768919658,
        15.428145290012955, 14.800605964649103, 15.990949424635108,
        15.869365567783806, 15.872474774329305, 15.769421394877273,
        15.05749135510839,
    ],
}

# X-axis categories: the years 2014..2023 as strings.
years = [str(year) for year in range(2014, 2024)]

# Set up the figure and its layout first; the traces are added afterwards.
fig11 = go.Figure()
fig11.update_layout(
    title='Perplexity Versus Buckets for Different Years',
    xaxis_title='Year',
    yaxis_title='Perplexity',
    xaxis_tickangle=-45,  # slant the year labels
    legend_title="Buckets",
)

# One plain line per bucket, in dictionary order.
for bucket, values in data.items():
    fig11.add_trace(go.Scatter(x=years, y=values, mode='lines', name=bucket))

# Export under the public name.
Perplexity_Across_Different_Buckets_global_graph = fig11
## Graph 2
# Average perplexity per bucket (the legend labels these as duplicate-count
# ranges). Each list holds one value per entry in `years`.
data = {
    "1-1": [
        17.410227605477868, 17.446573602753478, 17.307221780905284,
        17.338525603992114, 17.08551151136689, 16.818363305107052,
        16.98821894111693, 17.125795647512877, 16.573462144306383,
        15.4293630385597,
    ],
    "2-5": [
        16.11176217183986, 16.14852530113782, 16.297702171159543,
        15.960924352297502, 16.187802102106698, 16.474269837858706,
        15.936494557783181, 15.780419457145868, 15.283018703313582,
        14.608379914730168,
    ],
    "6-10": [
        15.632757662414805, 15.627408549576069, 15.948641884223639,
        15.912187993988933, 14.935072408852303, 14.944741674400241,
        14.79960386342691, 14.631430892394002, 14.378277745163881,
        14.118271697056592,
    ],
    "11-100": [
        15.446116676532212, 15.0055028132117, 14.799690714225637,
        14.822102470001267, 14.832038213200583, 14.568394784374943,
        14.435682562274105, 14.276477514399625, 14.0611924390084,
        13.880215644749589,
    ],
    "101-1000": [
        16.716943171826703, 15.565430373421485, 14.935989931859659,
        14.778913482337416, 14.508674264491997, 14.690158822673334,
        14.58651834886038, 14.337146941773641, 13.9886330091318,
        13.767106666731275,
    ],
    "1001-30000000": [
        18.156821563322765, 17.314701050452452, 16.09585768919658,
        15.428145290012955, 14.800605964649103, 15.990949424635108,
        15.869365567783806, 15.872474774329305, 15.769421394877273,
        15.05749135510839,
    ],
}

# X-axis categories: the years 2014..2023 as strings.
years = [str(year) for year in range(2014, 2024)]

# Set up the figure and its layout first; the traces are added afterwards.
fig22 = go.Figure()
fig22.update_layout(
    title="Perplexity Across Different Years",
    xaxis_title="Year",
    yaxis_title="Average Perplexity",
    legend_title="Bucket (duplicate count range)"
)

# One line-with-markers trace per bucket, in dictionary order.
for bucket, perplexities in data.items():
    fig22.add_trace(go.Scatter(x=years, y=perplexities, mode='lines+markers', name=bucket))

# Export under the public name; the figure is not displayed here.
graph2222 = fig22
#graph 3 tbd
data = {
"2014": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.410227605477868, 16.28263447660928, 16.056605184079913, 15.822614148687798, 15.842634843649147, 15.720699070243016, 15.687223294726039, 15.607834732758393, 15.572091951204342, 15.475459290252376, 15.337665345612953, 15.33475421632639, 15.325861061422275, 15.476636737344972, 15.693804028233785, 15.689754199668954, 15.659926393713182, 15.59464057615171, 15.588725895678929, 15.552308157234252, 15.38315488135992, 15.3749391039699, 15.186437103290823, 15.179577016115116, 15.175359268463414, 15.326051392123386, 15.550365066676973, 15.46274973581214, 15.675382592723022, 15.6083647300616, 15.775496160899257, 15.619470488458068, 15.630267399750903, 15.687059334218864, 15.415897825337026, 15.499602281425519, 15.598025850718154, 15.628460503669615, 15.658570343618969, 15.787877514096849, 15.710944180881294, 15.552274945554545, 15.699932540053279, 15.727560356232173, 15.599824119717585, 15.683275006354283, 15.641738631258287, 15.80315709908002, 15.706620536337898, 15.700588878168745, 15.911432681730176, 15.550009275425229, 15.822384367996918, 16.105816904042662, 15.562383488563118, 15.963855835984134, 15.852621368738493, 15.941133570933058, 16.188290366801112, 15.70084365155994, 15.609990413956307, 15.673631920556218, 16.006611785209323, 15.786230274505419, 15.433452154301659, 15.617135397912477, 15.640107157600301, 15.675806627110681, 15.671948319822476, 16.068440880032057, 15.769336862872192, 16.40254172818583, 15.940476853009686, 16.09877983788286, 15.495609182160944, 15.712818514069026, 15.61898546436921, 15.692158946904128, 16.493172099511007, 15.783765491247193, 16.055784648916596, 16.334082795006267, 16.176010490897976, 15.630577127947536, 15.905029905131835, 16.610640775886303, 15.245514025399112, 16.28252696514428, 15.435644188406563, 15.888062835224325, 16.250276704907034, 16.054194778686796, 16.620639801236162, 16.102213595669074, 16.09682778567417, 15.881305605266526, 16.217666050845356, 15.886905671039385, 16.420120825444208, 16.575208311709837, 
16.57735734574608, 16.186575145468233, 16.043253935667327, 16.63513328173465, 16.39894567786065, 16.41214937220052, 16.493426793298827, 15.9907685927303, 16.340040345074534, 16.951414035127105, 15.885674447160902, 16.410931308490415, 15.964154315977636, 16.810589683350447, 16.745778707293876, 16.468627893278832, 16.138744388702552, 16.407068111214684, 16.69176851966938, 16.324663512055274, 16.433577086199467, 16.434498347983276, 16.70257568394254, 18.747662848672356, 16.321669513149416, 16.69707440155245, 16.900596553383878, 16.68130890408306, 16.59473760593977, 16.54783975654349, 16.88654672752656, 16.078918331814624, 16.299820079993204, 16.373797255734377, 16.866705899661024, 16.397749521656102, 15.963898354324714, 16.82397059101694, 15.93018673258056, 16.98101514795396, 16.159948488588498, 16.726848882847232, 17.07683842070863, 16.113967724590644, 16.15130250991399, 16.80200457395006, 16.497186754611253, 16.666948876534608, 16.27533407301657, 16.308682326270063, 16.49999383144354, 16.359445800006256, 15.96150693135751, 16.60238027701047, 16.852103553279054, 16.521323558607705, 16.892194162833896, 15.693912585511482, 16.941903323105247, 16.480018831423866, 15.994720828335334, 19.96982983642109, 16.5613669780375, 16.410472896702814, 16.930635781928018, 17.307088122382734, 17.141450875814638, 16.793262685672637, 16.898963500457878, 16.034046523941534, 16.535173078962604, 15.623283937530607, 16.9146472987719, 16.710942224491752, 16.986982069138335, 16.094316754584177, 16.828775635709547, 16.087671276732564, 15.85332219694136, 16.48892512748128, 15.947276977857264, 17.071060205585102, 17.024065382461824, 15.924022369577948, 15.155645181021022, 19.43284882900329, 18.262079233670903, 16.72008178909451, 16.191840443840587, 17.202976578718893, 18.073639551374267, 16.211906986032727, 16.893893336751606, 16.459697938511802, 16.340211536130877, 17.323792190608398, 16.166587611972542, 17.10118411108414, 16.87592915776603, 16.22000303371821, 17.099521471855354, 
16.65188809044026, 15.439452520219506, 17.1238180228351, 16.822849013604262, 16.573524603379, 17.943366953648695, 18.61078665129674, 16.781687468016873, 16.277476841130934, 15.656708089753856, 16.93898908638033, 17.165185636822365, 16.88121672323756, 16.662421334264874, 16.351884226195278, 16.409706698188405, 17.36934322952571, 16.42350307052468, 16.644262788006284, 18.645487431486863, 17.45592775934621, 16.58861831024693, 17.826687228059075, 17.717259497674252, 16.173776963074275, 17.81471375669573, 17.043108559597915, 17.447724642873848, 17.245380090633933, 17.159851613935718, 17.06408636418627, 17.636831200319357, 17.226401140951793, 16.89171092276326, 17.27705035910921, 16.42925715421899, 17.297253521528557, 17.152355698826447, 17.673683744959348, 18.04475478619425, 16.737975421424565, 16.86577082453459, 16.863767158267972, 16.384443285083982, 16.461263048130785, 17.02229949930192, 17.101654001031108, 17.356582073600375, 16.344481856681604, 17.17676991586537, 17.185069687958347, 17.56978076611228, 17.438405238494422, 16.801320242413205, 17.283593618974137, 15.979660333719643, 17.530455106750154, 16.192472201610578, 17.392028244723697, 17.502518627885713, 17.407844930629604, 16.696324269027805, 16.03847705843595, 16.23747483686068, 18.737873580931968, 17.86589992376309, 17.25159517234638, 15.618977309780984, 17.21762645376281, 16.869727185054728, 16.96866468612357, 17.412146418998862, 18.090503138314943, 15.752757796291071, 18.160108290669523, 16.495087053440795, 17.89917434478209, 16.704112151245884, 14.966161599960373, 18.271963637296526, 17.495885294624035, 16.876079860453665, 18.868793874875955, 17.23085150515865, 16.817181665750674, 17.24528354632844, 16.338842229657274, 14.433218936285867, 17.32290971310563, 17.641663765189666, 16.756405276984953, 18.144689315919752, 15.468462735891627, 14.740977777972642, 17.74261979627107, 17.1782285639448, 15.146783133278753, 17.987671541660372, 17.24769683193406],
},
"2015": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.446573602753478, 16.33448355873305, 16.00933847199168, 15.983039417794657, 15.85241889834333, 15.784779195636053, 15.703616129507466, 15.644552221919497, 15.514620657659218, 15.387526054739084, 15.334150663271437, 15.283029028158596, 15.16893769161261, 15.06255641892843, 14.993982766398053, 14.980830424168435, 14.894978523241926, 14.874134900735003, 14.918616109668594, 14.935196627981224, 14.982270030145886, 14.87532185377661, 14.923414109699833, 14.808884476234967, 14.853798330915781, 14.83634262877924, 14.884103172040687, 14.791729350119317, 14.841381880562261, 14.743489161054097, 14.749541904917374, 14.713088846373518, 14.736115099328263, 14.746879446029086, 14.713805840007282, 14.709588712899263, 14.577444316933803, 14.739053818392359, 14.762066899257567, 14.595290443430146, 14.691786246925215, 14.600135579482911, 14.647046245438082, 14.620775122740088, 14.617623649249394, 14.753907355407286, 14.76706893970498, 14.765124172688255, 14.712500515305928, 14.696874508068367, 14.81907059899775, 14.750912761553202, 14.625221044179284, 14.911875833497362, 14.725436890195013, 14.895866319885872, 14.659625760331911, 14.852191929623093, 14.819421246401733, 14.91638925652532, 14.88761718198507, 15.019561783059467, 14.926188679928243, 14.8976261202685, 14.814586514502857, 15.218634880057785, 14.987322499272901, 14.79324036398735, 14.987857051466115, 14.91859841901808, 15.125937006958523, 15.048624233676273, 15.006355658772083, 15.14372619927069, 14.81255875957223, 14.958579010235287, 15.174255696222813, 14.97779920274053, 14.886781555600182, 15.123245906261108, 15.262453421918734, 15.139709301302887, 15.34390238170429, 15.206255080716389, 15.134486108578406, 15.047922031259601, 14.803789104506233, 15.322960903420322, 15.192822749515004, 15.045035737995157, 15.214772119350238, 15.096963559125617, 15.068896811418327, 14.51649887948954, 14.982094339496212, 15.358409262348665, 15.19060977626869, 15.197210458056878, 14.903441009852047, 14.955607943792616, 
14.99802494960245, 15.258130575745614, 15.5961206364953, 15.127040675697534, 15.460715059845283, 14.932271657615281, 15.332884367528639, 15.123204051950779, 15.24841813197201, 14.609549190518756, 15.496145584138791, 15.356557731249675, 14.94435638252105, 15.40016790545015, 15.755785011924306, 15.88238600117194, 15.670025630133424, 15.174842879119527, 15.112808149092393, 15.916588492185383, 15.175123852751197, 15.279512273042515, 15.847247739941714, 15.127126150755517, 15.591793878592481, 15.06298509221152, 16.003796703676716, 15.10754102021539, 15.962159399553459, 15.487914665938384, 17.122931139445832, 15.356883096594833, 16.106449129036644, 15.497583530145157, 14.81500158364873, 14.828355939887157, 15.236159256301672, 15.25841746072546, 15.345339692635477, 15.222124656846049, 14.878872707670828, 15.7900744642692, 14.958474140144684, 15.452926646855744, 15.809314812627504, 16.753943507801743, 16.50490961997181, 16.30289768513265, 15.582105870019463, 15.293213323151798, 16.173154239856846, 15.56344275477801, 15.003733846631661, 15.284441404625872, 15.310476987813113, 15.363259286181686, 15.378055808567508, 15.057319144633526, 15.196886386615455, 16.38508832789645, 15.533186110742182, 15.660575940541118, 14.999316634232597, 15.082654165851046, 15.140771984416322, 15.697283703599341, 16.502698997686203, 15.504693814089743, 15.547051916893142, 14.632280542436765, 16.129653356314194, 15.07420239746008, 14.978919677469474, 16.696916098163943, 14.885171910958753, 16.424189169593735, 16.63984522475825, 15.602313267179182, 15.380550660866582, 15.401771117577445, 15.231008081340729, 15.526480937690698, 15.253944535567081, 15.420602337399705, 15.088673361396923, 15.13791131493271, 17.170354799275547, 14.802302709465538, 15.391186800441876, 15.224508599986121, 15.356444086519367, 16.693016575301478, 17.090623668677193, 15.304231190267757, 15.148114513126695, 15.963496319760543, 15.44065314571742, 15.580535041960834, 16.842657665797365, 15.951080414141158, 15.529778723386256, 
15.62919803763155, 15.313095703462354, 16.85564092895975, 16.326466103925515, 16.46689117444728, 15.577008697251697, 15.351489294062441, 16.14993653398667, 15.617966096026468, 15.877478213598732, 15.063997419778746, 15.779720026472049, 15.553359932608748, 15.416296077423834, 15.494589706245751, 15.788389820892599, 15.854571840070681, 15.411859733466283, 17.272376126374184, 14.978897070251108, 14.815726499166317, 15.05127178427838, 15.254732430093432, 15.48860976529979, 15.058258294814932, 15.33987120963303, 18.023076852959214, 18.225873662488258, 15.863931658322667, 16.427509106938373, 19.275509837094425, 15.81875941911799, 15.54111011827449, 16.677238943979567, 15.639847094789507, 15.220325425059306, 16.41161515359668, 15.488428081895368, 15.03498421775642, 15.487946653043347, 16.01984421565911, 14.57648295012637, 14.84545953400777, 17.609597747578352, 17.157577413896192, 18.679980348874565, 14.556018017450308, 16.196751121887516, 15.10185147463676, 17.686782120509207, 15.562463844274184, 15.888765556678129, 15.860827178562165, 15.848727089760024, 15.170566268590228, 14.808042574360089, 18.490268138761564, 15.45533884237719, 15.433460403959973, 17.254269870711596, 15.342865141549579, 15.601265739597746, 14.593595690549735, 14.997578247444377, 16.0050764933235, 15.787742433059544, 15.869933672425715, 18.193773757858533, 14.553107582993643, 19.98376615428642, 14.95451448606246, 15.072796337587288, 14.699652604291359, 14.655611734258843, 16.072567043889563, 16.210280944370062, 15.624767747252127, 15.324595170575053, 16.936626314427297, 15.656972252174022, 15.365396661405722, 16.056896958115832, 15.296691142785189, 14.525524866379902, 15.076000794224212, 14.40293229833154, 15.481724995978828, 15.007345860622067, 16.136110973861815, 15.732101759685424, 16.736637008621052, 16.026289361354852, 16.302622787180372, 14.341728063393646, 16.66822587109269, 15.760918873766236, 16.21117509050699, 15.824309655687308, 15.401576029240012],
},
"2016": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.307221780905284, 16.234776478792423, 16.30364088551167, 16.379029565763854, 16.52356312405983, 16.24530925560526, 16.006540792933116, 15.85403446105224, 15.723979893931466, 15.63501113221084, 15.581423241492276, 15.567203466817464, 15.467076541338761, 15.384256809950589, 15.217246561754829, 15.10033102057403, 14.983988497758792, 14.891815052698316, 14.778270674791566, 14.701723831957946, 14.62637352080993, 14.516481461285027, 14.50465541788953, 14.428207241225165, 14.37516921139166, 14.361626978901834, 14.490208181211544, 14.548160252144106, 14.598462844559366, 14.752690053910175, 14.828578155120072, 14.742911603952818, 14.773274548959739, 14.647794448552009, 14.56823005496042, 14.613763862920718, 14.426621123682969, 14.478844375622407, 14.422306783085949, 14.527778623598294, 14.325195633814634, 14.390594307260038, 14.364773158798116, 14.383213457600299, 14.35308212412287, 14.352372514800544, 14.201870671662768, 14.277748866799087, 14.312696383944079, 14.313891188907224, 14.329383264656686, 14.47149939181459, 14.491734262509468, 14.513431812957156, 14.588016261640757, 14.403651347510129, 14.51384158930121, 14.624577984096032, 14.822443028314837, 14.48737379308041, 14.425541898334243, 14.430122773766353, 14.388508890641424, 14.504527435519458, 14.464901503427619, 14.653700915470745, 14.595648024211519, 14.449564315780473, 14.612423755765175, 14.671255472629436, 14.523365635575571, 14.570864952164412, 14.675754875651336, 14.611781322204267, 14.50904332362948, 14.551067538526674, 14.396781112278433, 14.4996889940005, 14.75348433384515, 14.748574368311367, 14.682659515657313, 14.817868067283271, 14.66048427952218, 14.62898199025576, 14.667195610554206, 14.72678737366503, 14.792133972263503, 14.544303597718525, 14.693020091609378, 14.654447026029196, 14.703904432040945, 14.424298987064056, 14.938344051200023, 14.619739917906342, 14.565987744854835, 15.107383346624445, 14.511204728522042, 14.449450604819619, 14.60351580074054, 14.433500805057605, 
14.743392142728267, 15.231768885000825, 14.761516121146009, 14.61165675226126, 14.90598336405985, 14.91175193989237, 14.564636821247571, 15.103038504218528, 14.478713406434574, 15.227275522759577, 15.022744873864598, 14.620219145961974, 14.785211033367963, 15.13012168013741, 14.966301178256803, 15.023857320232775, 14.932136164613826, 14.916861609698104, 14.89512418972303, 14.771309185194937, 14.629565522238666, 14.801613342132413, 15.031938958819314, 15.015627929689526, 15.169636442102666, 15.248843746873948, 14.5845960664532, 14.80060552408705, 14.686464454993288, 15.211243508451018, 14.843377415541585, 14.78139335553135, 14.709272565819346, 15.042772236679735, 14.901835278704146, 14.87732704967686, 15.110419431311994, 14.945782391612148, 14.77586496097264, 14.697465204514597, 15.018728840934191, 14.648390805578318, 14.503034231961104, 14.68954892015273, 14.82810870022996, 14.569718037154127, 14.572628356722591, 14.858948316160495, 14.556753268113512, 14.757877361048365, 14.611562311403345, 14.717578588265276, 14.733806351762832, 14.867930349202046, 14.708928870526954, 14.60690642587284, 15.14502452412242, 15.107548842832665, 14.415694833175626, 14.737446116732965, 15.01618490970902, 15.025735505545079, 15.015223374474092, 14.788751431936802, 14.86620257038334, 14.931136458043323, 15.740785615445478, 14.808267919803718, 14.972592668748439, 15.141946935844496, 15.18472280586112, 14.85580192562743, 14.590730129109179, 14.855881371809206, 15.078635844463975, 14.917158174494922, 14.950622357039615, 15.201539290162318, 14.82959828904692, 14.889714788370952, 14.988233657264535, 14.910959338958069, 14.682041728334324, 14.697007957600201, 14.841925030620626, 14.895353098337022, 14.902095228260611, 15.086857166255568, 15.215767403635036, 15.56933817584006, 15.024896525609627, 15.167838031837093, 14.94121712496779, 15.024931497552117, 14.492560629538843, 14.741020592228535, 14.507200801687778, 15.458663873044172, 14.316896863535968, 14.609290807064818, 15.027364270163478, 
14.936512288174443, 15.253954037048475, 14.510609936444846, 15.916676128127982, 14.656533951948624, 15.345831998830816, 14.254683784179212, 15.10289649943302, 15.38091692240808, 15.141691037390665, 15.165877037351509, 15.199873038454554, 15.16527646186345, 14.76968338527267, 14.954832100582504, 14.836598589446387, 15.110291187450528, 14.641863100383437, 14.937350641186566, 14.841399293047491, 15.467068880425895, 14.665284963662575, 14.817881002793591, 14.598636006589858, 14.684164028049974, 15.14425828783176, 14.422497163470021, 14.796764157649553, 14.744954865597302, 15.404677012769369, 14.986457456438755, 14.81969445960239, 13.992963378364456, 15.195532009187653, 14.845520034088448, 14.004280102433553, 15.041711235754534, 15.02108593809691, 14.738176887035477, 14.69767387768106, 16.03853288392953, 15.08406239514085, 15.177005242060092, 14.983154630158717, 14.728424188043775, 14.71519779072297, 14.726374986516426, 15.094235154391239, 15.029036096533034, 14.854841251155284, 14.885824338461951, 15.048620593479637, 14.83695301506028, 15.690625629638612, 15.373086697008327, 14.653274585194445, 14.857267781088177, 15.085373410780127, 15.95265927867797, 14.252191466013802, 15.461625044517037, 15.424916495835996, 15.135633081682494, 14.924146425445693, 15.17655062132758, 14.146194759260652, 14.877595658709714, 14.826823556584703, 14.934354978925048, 14.860723131282562, 14.902811748406107, 14.269230470566441, 15.443474729284654, 15.51211361992304, 14.931369047553755, 15.251102680088037, 16.333014054316223, 15.348153571473588, 14.994998859814807, 15.02055006842947, 14.550322529281782, 16.747685377509097, 14.61405061842175, 15.271423606471101, 14.913829430481542, 14.942304143822593, 14.880191844218682, 15.205724737725303, 14.508432092262984, 14.94832514929929, 15.191642071801384, 15.104062600091243, 14.367253080997536, 14.820283025758636, 14.902115518264766, 14.976713453340755, 14.53661719522025, 14.57269990405486, 14.383623568744957],
},
"2017": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.338525603992114, 16.203745269249215, 15.743623454352441, 15.734634467146362, 15.589952534971571, 15.674756753821354, 15.809161959808193, 15.984202107160641, 16.4241410848677, 15.748360557975762, 15.503652893791108, 15.48276933725104, 15.359691775186452, 15.265874486753685, 15.27002791496366, 15.30935492406096, 15.176258134181692, 15.148949478936686, 15.028798289991284, 14.90744299336548, 14.820689888178931, 14.730663559534568, 14.698074187272612, 14.682410624091638, 14.583179371506233, 14.53150003082502, 14.53885706635866, 14.532888163095201, 14.459774520912301, 14.477194920807293, 14.451738865284145, 14.434821354142883, 14.41092827247155, 14.399897943713333, 14.369944479331494, 14.394540607240975, 14.421030541126406, 14.402463627156687, 14.402775919237724, 14.419437640759872, 14.367993463310803, 14.500451281790058, 14.412866100031703, 14.462751191430899, 14.406691066470577, 14.39351237812279, 14.42370247965012, 14.394195683486142, 14.367637888631284, 14.317040785476035, 14.384165211134619, 14.342293061646123, 14.256587327198664, 14.255209117053106, 14.161250551154946, 14.182886130471418, 14.337296431014249, 14.250283553686213, 14.315223610910822, 14.29277934588697, 14.259173667263372, 14.309373028552786, 14.26932675271818, 14.25296041254812, 14.297957286484179, 14.291230396774537, 14.3288422595368, 14.391208183310448, 14.508950496368158, 14.369923015151878, 14.578679879400276, 14.643292099792278, 14.503639422745408, 14.395277634894851, 14.617563409720901, 14.320809204278323, 14.326863770514343, 14.492267481694547, 14.53833400544276, 14.479261811733661, 14.390689624911246, 14.559188164442414, 14.347725987723816, 14.39174864710453, 14.532684077312041, 14.477688969937942, 14.499122225226834, 14.38917045391089, 14.393872052024337, 14.353218381093932, 14.470166967628375, 14.369508699574117, 14.419008254975036, 14.542500865279285, 14.560838318132463, 14.58058785889303, 14.607055203147862, 14.43193144016228, 14.829687836802265, 14.449026644037072, 
14.48998003947198, 14.611917269679976, 14.599098659379221, 14.70752026139727, 14.702225056022963, 14.456101785047814, 14.653484092796994, 14.70689023296051, 14.435274179143056, 14.532231364945941, 14.521113153182691, 14.326819931888322, 14.635369987417324, 14.603509022887518, 14.682676839692993, 14.577873452861347, 14.457069909806911, 14.57983212015869, 14.439574851221634, 14.56952208401313, 14.481436757921992, 14.605696638301199, 14.663586360418082, 14.762704505619975, 14.696344599118095, 15.058978095342402, 14.679614275191193, 14.782876796374236, 14.4329249104854, 14.56553422568721, 14.83391429316557, 14.748817492666898, 14.703605394383715, 14.609897874420477, 14.616378288322748, 14.77832918471473, 14.479572959548198, 14.839584695885266, 15.073442936116525, 14.453779301176265, 14.823911857453854, 14.660256560107975, 14.665502643560991, 14.749573922593015, 14.71023539853617, 14.75193393865211, 14.62104590642465, 14.605726048725387, 15.23915168638822, 14.595007415190265, 15.036796604259008, 14.69937457019285, 14.606595698619232, 14.406195191711271, 14.844717776160179, 14.637451403580533, 14.73051115891568, 14.524288854877469, 14.917830094416082, 14.614947053211404, 14.481609856640228, 14.655834471577693, 14.227499362972685, 14.486019268378959, 14.601624977436405, 14.75459491314579, 14.595313529419624, 14.72509719938368, 14.716095939861956, 15.042036469594322, 14.822071159312484, 14.704056751960753, 14.814756972832775, 14.660566475923453, 15.32705108123779, 14.811430469464787, 14.753795298335223, 14.787537787393061, 14.726258599649885, 14.888144523578852, 14.578666188666858, 15.48832732403903, 14.893041433317489, 14.842996804540338, 14.719123031667849, 14.951437200499774, 14.413844979385376, 14.542864925725786, 14.809384952949387, 14.950312336308098, 15.033195874525896, 14.9942146762989, 14.72594276483278, 14.818267391408009, 14.833977053560968, 14.935809475323842, 15.264943149866932, 14.778009547157467, 14.870954635676403, 14.959498334141584, 15.08716336448507, 
14.520830803617603, 14.952029182593325, 15.087540174436855, 15.23470807359972, 15.410612858318652, 15.053440134797949, 14.721241033320792, 14.965750225636034, 15.41726206267645, 14.981004593158513, 14.753634737522535, 14.864483127379483, 14.711506518090479, 14.744846795714427, 14.579622519532153, 15.33109505629075, 14.502654549125777, 15.075854816302078, 14.404490632309455, 14.583624500642594, 14.812122832723535, 15.083552248412369, 14.89488400720679, 14.80901764184227, 15.377589395843788, 14.607655632691126, 14.661681978639534, 14.94182918388782, 14.524723199136687, 16.378308656806624, 14.744146709196684, 14.568067658615197, 15.20825130391414, 15.43766325471979, 15.377202599450115, 14.788270335652301, 14.972957705527788, 15.569618923359307, 15.035417167620839, 15.716903651264683, 14.861895451311895, 15.273852366705366, 14.823991172300325, 14.586889078548603, 14.993219393776187, 14.705643220833624, 14.813598650853102, 14.579683191023557, 15.09572503306876, 15.249413549876413, 15.018545433789917, 15.001407309408743, 15.266611462536407, 15.295055951617993, 14.767761903822773, 15.206324462510874, 15.559532265914733, 14.785568626693545, 15.113806291221003, 14.790114427375459, 15.096261371426904, 14.53563755791196, 15.332730200170944, 14.73449338379727, 14.383623969590408, 15.191473711664047, 14.611626122188666, 15.499340732138753, 14.67712043132989, 15.282937735532999, 15.429914403297502, 15.373442513947067, 15.905383903260773, 15.234888147062103, 14.688116267490793, 14.465993946950508, 15.165784388673215, 14.841821728155802, 14.953859599973894, 15.469443331628613, 14.771122101766585, 15.047230872308521, 15.123684605453414, 15.176629987437977, 14.98265529965959, 14.678296918807122, 14.835686619841164, 15.2011887342145, 14.216768660472994, 15.544884200637565, 14.808085893691599, 16.411735465807038, 14.955775618549108, 15.476155856267278, 14.957565845543835, 16.02528738696533, 15.032999674760873, 14.633066583922867, 15.231517143471306],
},
"2018": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.08551151136689, 17.017409528265063, 16.473327146320948, 15.489607077583976, 14.99999142269165, 14.91941818722109, 14.934676916202214, 14.905168583562467, 14.889779862855368, 15.101460828368536, 15.277767914352683, 15.372562426056486, 15.237912427608558, 15.144916550505076, 15.097228076989598, 15.027981638522666, 15.041650504633653, 15.039315955294928, 15.079673813248638, 15.01559865162396, 14.86827687590184, 15.035103083818093, 14.979396295193135, 15.004577409363677, 14.868860388977389, 14.706868255708677, 14.682132861614424, 14.58608796051945, 14.583801121238027, 14.602760512229612, 14.635499944457107, 14.54985476009246, 14.517388362803912, 14.424612593267815, 14.356443505732349, 14.320246164742109, 14.32942869403736, 14.312540328006811, 14.285359354029762, 14.23664592294733, 14.2216004270453, 14.26761556180727, 14.272762101599167, 14.2435412514733, 14.179271594687851, 14.197076962309092, 14.156703101832047, 14.160208286167808, 14.175229746671393, 14.146635777103596, 14.119723989874416, 14.166581376841608, 14.11063165634931, 14.158191428075831, 14.123590757983367, 14.084318666837452, 14.037386481477629, 14.052929271479353, 13.999064575195867, 14.029998213491039, 14.085681596698128, 14.115590275368502, 14.057376003054532, 13.95691072215424, 14.04820478262793, 14.006810938903278, 14.16821288854753, 14.046307574280926, 14.157018440960517, 14.068759463432748, 14.009289321906962, 14.101583690268125, 14.084153022450309, 14.128629997577798, 14.054478824631365, 13.99789759007014, 14.029294022700793, 14.120556559672547, 14.06850831154868, 14.193091716662481, 14.111214488209695, 14.057745125547271, 14.163744339369122, 14.203482287973332, 14.084023869280376, 14.087059883933515, 14.159595333199121, 14.250950032773568, 14.044348353827543, 14.139417225867433, 14.388449841133475, 14.086184279954336, 14.13927865138474, 14.103454229226045, 14.17936753834711, 13.997130775289959, 14.175686386038445, 14.040504409332115, 14.276567944025343, 14.130128330365181, 
14.157628882251041, 14.118883833248233, 14.21411018421439, 14.158315748739875, 14.374685589752955, 14.205982942155632, 14.07231131157327, 14.148826256775408, 14.0463063135345, 14.29559105022842, 14.699947308651737, 14.224844793204428, 14.270933778435285, 14.45803225547581, 14.982456953901945, 14.31781012375104, 14.274597726232665, 14.294033160896166, 14.223513900945731, 14.384520341367507, 14.463819877539144, 14.488171518604748, 13.979611784952175, 14.272705963111509, 14.410017825884983, 14.343266018381327, 14.323089655828728, 14.124110925918979, 14.344805655428692, 14.288532389553106, 14.146709166565785, 14.43993740768601, 14.484295925445798, 14.359979583505035, 14.390022354485474, 14.481346450985473, 14.497645969227946, 14.73482258133124, 14.421206373719997, 14.557374979130687, 14.389218845252664, 13.921585899547281, 14.524009855576425, 14.404591364406048, 14.445618911203617, 14.53246479076758, 14.695596471265455, 14.541356275372726, 14.720750266017621, 14.733047385457983, 14.399671256473548, 14.730309069788058, 14.573360150553853, 14.829219177535798, 14.616642710080793, 14.553439665610382, 14.585681016503, 14.696499921083584, 14.254707775168475, 14.532110701362317, 14.611323085768618, 14.543545533821455, 14.594876336705177, 14.569194658920264, 14.482698701837924, 14.694438504643307, 14.335206265450186, 14.548170393027661, 14.595343524718512, 14.313075747032116, 14.419399996099525, 14.622371217096244, 14.445095461274985, 14.417828340402506, 14.590657959466622, 14.290907126746568, 14.537614442655705, 14.343957392622876, 14.35706953914797, 14.398020676700606, 14.22368723103676, 14.437905951752546, 14.674447600091657, 14.75625998516921, 15.579670438788382, 15.065195933489692, 14.477353129283996, 14.340181955802624, 14.649093255070694, 14.22899776464687, 14.797860784901735, 14.175241156618343, 15.08660683229495, 14.54174486952973, 14.51034016113076, 14.711416365809932, 14.917069256432894, 14.413902903342057, 14.51579671870371, 14.363158781681612, 15.156257729551365, 
14.351562381589106, 14.631626094733827, 14.54160309139232, 14.958644551508241, 14.328040536196967, 14.836468602447896, 14.618058058761168, 14.687128172180751, 14.585715117544657, 14.758648910227583, 14.619303844564032, 15.16452152995779, 14.966621742960358, 14.500593602710854, 14.860684515921202, 14.735198796861527, 14.7054797386434, 14.656783902436345, 14.756265260740637, 14.151289774685646, 14.589083808577307, 14.597878649264747, 14.617067130952734, 14.810381739372293, 14.723288507154296, 15.169244896607879, 15.222911100290771, 14.516473252534535, 14.654221879404016, 14.597901258041633, 14.776648468745911, 14.861584739898804, 15.23897106330057, 14.60966370623957, 14.873671194846414, 14.93612904100658, 15.015972197391466, 14.683478811048316, 14.826474923051949, 14.99467004706795, 14.801534903481752, 14.766829811699983, 15.0966363430717, 14.914861100323844, 15.183919855400513, 14.245321211762812, 14.190354276751055, 14.766879254304731, 14.142545990111227, 15.374573934831558, 14.859978645365866, 15.296454128235439, 15.005596202148249, 14.744984863401601, 14.34643807720319, 14.475034908089677, 14.709114468534864, 14.736943186983439, 14.42073814550631, 14.506059499704438, 14.473742463397024, 14.618391200324082, 14.589891533142023, 14.997001165633769, 14.795483671635305, 14.27848789177751, 15.138255578583978, 14.834263127695507, 14.771238943514723, 14.747213748240789, 14.798733124706626, 14.532918351260932, 14.950583102776458, 15.552259399468454, 15.12783446905641, 15.215579477179926, 14.471794830430369, 14.740651466871597, 15.144502305980348, 14.875364956591815, 14.443567163521013, 14.875743067972856, 15.129241877637964, 15.3090759550837, 14.768736872364462, 15.1841234624018, 14.51734231534217, 15.036041111737525, 14.731338820770624, 15.261412313678711, 14.295315456490005, 14.99224943887244, 15.098297215130652, 14.739582684146058, 15.40461423557035, 14.505097386511684, 15.038694095563027, 14.494821021436477, 15.21965220393292],
},
"2019": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [16.818363305107052, 16.9384196002684, 16.373544163301144, 15.915842635402715, 15.495413806206251, 15.21813749917199, 14.981956303655137, 14.838254291964295, 14.76689313041234, 14.717622741724327, 14.652035688314417, 14.675703419603789, 14.676956961485203, 14.68153300251823, 14.68379760210929, 14.657486268060575, 14.676872680734599, 14.660069429839945, 14.634235874675083, 14.594851416980822, 14.532981693881329, 14.518467506154115, 14.498061602754063, 14.50359008364371, 14.499692504768717, 14.497089885925234, 14.346527214520817, 14.375469479863991, 14.36217746815957, 14.369260433451691, 14.567961179021168, 14.592515669479713, 14.582806082614281, 14.427714905350035, 14.28349203614485, 14.244431746998693, 14.17335303845642, 14.13413706921266, 14.1704889894961, 14.210070752006516, 14.164155842322359, 14.241401877344122, 14.259333116642207, 14.26209597790733, 14.233323759820998, 14.27527708370166, 14.235957127875976, 14.260371069971875, 14.251584104018576, 14.246656629527484, 14.364605885916907, 14.292805105377587, 14.199796446635496, 14.411856208959865, 14.406722253424034, 14.251555504989668, 14.317774155701631, 14.272654395870804, 14.185324746396732, 14.085700290006402, 14.222972725734655, 14.00716838577262, 14.190132352105405, 14.233049849028568, 14.284342014396278, 14.137968659408836, 14.275066624183827, 14.392659025077748, 14.140964316097964, 14.259717421340069, 14.342471907094104, 14.17383011709637, 14.013535232449604, 14.327288484160523, 14.139968440566038, 14.395982360090636, 14.207331288389051, 14.140194363686335, 14.204859886070256, 14.432860215814515, 13.572486504393169, 14.252771725460635, 14.095564630892566, 14.363579419734007, 14.418378787697504, 14.26376709920845, 14.351803131539878, 14.38357383763439, 14.40615109787678, 14.281738198765106, 14.18807550562207, 13.869380756576668, 14.36346954737725, 14.276972917585828, 14.3604303608435, 15.188735964867677, 14.792139152181454, 15.098762493319898, 14.87784455761382, 13.884399310877278, 
13.859563871251646, 13.836993020011077, 14.051264784446204, 14.323106670622142, 14.514366953736504, 14.516665443761871, 14.750357301218527, 14.199680753932574, 14.416337292709834, 14.857635888054926, 14.384030403976343, 14.902915738566662, 14.323945972002745, 14.466001050980731, 14.354049612607561, 14.229693987628325, 14.710493178618231, 14.548242314603701, 14.497546848597976, 14.356404424959749, 14.53530968254845, 14.27400897380326, 14.332690564745262, 14.472114483414982, 14.346963017872124, 14.735745182840818, 14.410660190079582, 14.661404983131112, 14.5679107208867, 14.78705195945152, 14.284570571196062, 14.450880101798376, 14.40282201981158, 14.421063475750937, 13.694975403417804, 14.134743853086364, 14.431594417898266, 14.452930007412851, 14.466336558468972, 14.192810846247854, 14.382971433599055, 14.60549520534943, 13.857005504326008, 14.44726389661245, 15.882433447671191, 14.931474931358919, 14.660164271592702, 14.593546234799078, 14.27183471486294, 15.066894098641765, 14.536617568488758, 15.117366296649658, 14.56638968512836, 14.750528595558201, 14.468849142258842, 14.896127642308747, 15.019204503159425, 14.706498731150011, 14.627792723676187, 14.742346111733225, 14.60481349294382, 14.97509955271017, 14.336567817167849, 14.677503440539182, 15.218089838817582, 15.402562958356604, 14.187143176248465, 14.78658600408109, 14.794912292258529, 14.609724199324852, 14.958991912036334, 14.209041084136771, 14.983361291635962, 14.341997698680517, 14.665256016769371, 14.761917546948164, 14.535832785640112, 14.22107360427565, 14.532382759740454, 14.80442504890915, 15.001451110568746, 14.666429595146187, 15.040283093745517, 14.830024662429224, 15.178689445578676, 14.74487535109334, 14.76226189171742, 14.216006491892387, 15.041870740922365, 14.735238928256866, 15.064160946520538, 14.187571631865708, 13.952757907461969, 14.671414201788117, 15.254778187750826, 15.00803314937916, 15.101744169852097, 14.597755929912422, 15.516273859063304, 14.859096733328412, 
15.156726701434254, 14.83635437461029, 15.484892021360674, 14.853687890573905, 14.452850335271902, 14.902735468954816, 15.314779072773824, 14.201654493889864, 14.733634310314255, 14.603323437807163, 14.316334447980559, 15.651563635776926, 14.5428461114861, 15.634935103903274, 15.450083839772201, 14.81805887551945, 15.321542090540696, 14.953636433367153, 14.61533324387713, 14.856432629267461, 14.497654236558567, 15.19369187303432, 14.084670634034236, 14.559689946051137, 14.422837261653042, 15.326590541934966, 14.815694783570903, 16.11336335053699, 14.477894981937279, 14.658815929384009, 13.94824345787607, 15.091958715074714, 14.546801580697949, 14.499229190729503, 15.13412159656476, 14.168547246908107, 15.30210597311838, 14.828094825752267, 15.426011740409116, 15.158619144016168, 14.88084924072268, 15.060043720557001, 14.930340549832115, 14.868785091552331, 14.976821021905435, 14.858914068549007, 15.705812291184321, 15.290013367208434, 14.593670122497366, 14.312903147417623, 15.407973867347854, 14.846711542803762, 14.297227950036165, 15.019140596498042, 15.089245438803882, 14.914069858294754, 14.806508542112516, 15.334831231998987, 15.025878044500283, 14.919244367134333, 14.49300092717289, 14.737776979953303, 14.164272143865894, 14.822269643198338, 15.38840525416425, 14.894979478886672, 15.22223690619034, 14.327600485303089, 15.044064869948848, 13.84937939564519, 14.013057380266105, 14.972762100285964, 15.169941531740305, 15.024904641298892, 15.266379765285302, 15.12116347813683, 15.663150784684255, 15.289208121912026, 14.851834463840662, 14.098011319425714, 14.820968406564596, 14.432522049087067, 14.951442280106699, 15.347772241491882, 14.965616703639899, 14.737050989961581, 14.83879871083048, 14.180030416603776, 14.456052122204758, 14.706780316608707, 14.623600289797057, 14.122283891907626, 14.45783579937423, 13.954283695642895, 15.33804388915092, 15.326367452094553, 14.104709635258217, 14.572119980695652, 15.97127672565096, 14.502429220203572],
},
"2020": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [16.98821894111693, 16.370513604792954, 15.5962992453352, 15.34457724194128, 15.145027410230577, 14.961204778914126, 14.81681914711489, 14.72701624334705, 14.705103953556968, 14.659639224347323, 14.585941681915887, 14.616406148288082, 14.54489696103787, 14.500602728666788, 14.49438912322633, 14.476614809453949, 14.445764024706827, 14.451334081082246, 14.412458237106039, 14.453183197616022, 14.419415146317077, 14.375727605781263, 14.353189940035962, 14.386770485296116, 14.391023922379683, 14.369940063772127, 14.316986079363922, 14.28751116108904, 14.37695278550541, 14.376602719972492, 14.316083429115322, 14.412605409200454, 14.346012877362117, 14.194463592710365, 14.209962572796991, 14.30638291999527, 14.140715686001009, 14.11032354096776, 14.08932388255865, 14.163596362182776, 14.015274970719, 14.035500523445947, 14.081064777083556, 14.059262469872834, 14.098393089021668, 14.127387756897626, 14.177925151723068, 14.196369527393575, 14.110546228688507, 14.156041170771427, 14.292628768248916, 14.133254062565298, 14.076060255602068, 14.128683267299975, 14.100690560366042, 14.300641698843162, 14.189416892766634, 14.110541486570694, 14.042105925243993, 14.209573244412097, 14.09984824336511, 14.187626009998954, 13.9891768631806, 14.085976898385344, 14.110584718850642, 14.127695090137179, 14.047560139049365, 14.164531774421318, 14.243170489139297, 14.18711399265343, 14.252306645902003, 14.270660364725599, 14.018742179693277, 14.203152728170489, 14.11114000260732, 14.095189622320586, 14.175733016796135, 14.12640528525355, 14.1476195208239, 14.250949019383489, 14.28946911703642, 14.137797265291285, 14.124816493364671, 14.053800012469745, 14.257309666842751, 14.43422940581773, 14.202604513480152, 14.163614860908242, 14.285196582476628, 14.308994633625163, 14.673692934316794, 14.25088456318874, 14.19435275862046, 14.30723125536449, 14.042647691269732, 14.209698854879502, 14.573048625431696, 14.2512731159336, 14.119382008703974, 13.989892488209229, 14.42870954417215, 
14.378769414148628, 14.498830747763531, 14.1687405789002, 14.352354928133906, 14.482755712427602, 14.540381004714042, 14.082061245171214, 14.308879059107138, 14.64413320939842, 14.55672975225543, 14.597762574178923, 14.653181628225957, 14.566651933285437, 14.396808171088576, 14.254814519309747, 14.652776690373177, 14.312076086663604, 14.297837324665121, 14.478635173676405, 14.766128492445645, 14.74281817130926, 14.050189687362222, 15.071164526876904, 14.089101804268344, 14.377873623198521, 14.428162387206788, 14.06090101738822, 14.73211046682085, 14.397391200359385, 14.969796825255916, 14.21181077427364, 13.953829520831896, 14.421216722135016, 14.244561500812402, 14.659544345732002, 14.30380214400257, 14.346494448420565, 14.643921909340355, 14.676353661427488, 14.582860513955845, 14.380169502805304, 14.445242737706893, 14.14426212786935, 14.487235987583478, 14.434474674750891, 14.935409896690082, 14.51557296420941, 14.533649625966051, 15.056389509181635, 14.369417913972073, 14.57519932507594, 14.529862959650039, 14.520311131600797, 14.751264602070773, 14.52303253663038, 14.034007982076067, 14.874614869845297, 14.893296491574656, 14.847032460077651, 14.048106705033495, 14.7857781889984, 14.394545504262544, 14.92682959969511, 14.421822402770585, 14.738597193898885, 14.81863405043246, 14.719529547006385, 14.49174656953006, 14.579206559493965, 14.496080113819792, 14.683939444539357, 15.178248516935348, 14.781161924065806, 14.690954262415783, 14.592626398646784, 14.620818563833607, 14.792313058316815, 15.04026046902646, 15.271165416222335, 13.633974549799833, 14.726471734141892, 15.12571733970632, 15.347289709822073, 15.20887032383406, 15.38889560356774, 14.47088499847924, 15.28835971083243, 15.683200945016656, 14.130414367622848, 14.958103273266774, 13.882635466123684, 14.261885168592414, 14.952622454125132, 15.121191440102477, 14.218448105992932, 14.04778667497245, 14.282879315894712, 14.388023835193884, 14.943734425279825, 14.573802965069763, 14.59533592628099, 
14.137133673783744, 15.740756377040112, 14.738197920651777, 14.401407660047331, 14.678492445195307, 15.694388369476837, 14.970617129108886, 14.790890050526873, 14.081049702727105, 15.089240160980136, 14.973541692006656, 17.363773035244215, 14.30187824577634, 14.467930386802934, 14.516902572723097, 15.329479047198038, 14.624015710976884, 14.63473539904464, 14.373641210092153, 14.166605449430495, 13.783011574782721, 14.263544216558952, 14.862460470452541, 14.727532380698701, 14.531637756291413, 14.822949072623675, 13.786841833050836, 15.468646905878378, 13.687744658367365, 15.402759853996804, 14.554763109617756, 14.869860145474584, 14.696348658200264, 15.053898516516293, 15.585187607593465, 15.563313816410492, 14.67170366276461, 14.147429693845183, 15.075370337957708, 14.54650295647481, 15.179010783244516, 15.409213810776961, 15.515504225457606, 15.08444738015429, 14.28164868574861, 14.795723222168206, 14.494017381983374, 15.086575424633287, 14.5004735623822, 14.690241855908853, 15.16616264517412, 14.420163065055343, 14.645301486362538, 14.703220301962068, 14.849238046919403, 15.650596675034029, 14.632994392359596, 14.656751152341625, 13.42732972397951, 14.559955525204266, 13.86922509967631, 14.970856644090627, 14.777476492577463, 16.920064964091267, 13.862551797128589, 14.341017840554162, 15.05552539530507, 14.510146539196526, 14.82627197246354, 14.217575200807142, 14.558965165319933, 14.989795407670229, 14.864206988315356, 14.070177677455412, 14.591439215337656, 14.427307406625893, 14.658924923576608, 14.552212819309558, 14.496153901814848, 13.465088583786082, 15.279577878202042, 14.250419569473493, 16.682037909981887, 15.002301747811199, 14.982256666571692, 14.731409709159067, 15.049455411763278, 14.047122405829297, 16.130648201285517, 14.378254782238285, 13.578630316558009, 14.434082205270641, 14.021898725941734, 14.670519491759856, 14.453798843745222, 14.17311154064359, 14.402414278988672, 14.005273719141623],
},
"2021": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [17.125795647512877, 16.167745862518196, 15.628246706160752, 15.259120368931182, 14.926562361064429, 14.772507696160567, 14.648438494926047, 14.588138177135876, 14.54822196472763, 14.475861347759562, 14.460319047237233, 14.442843207466103, 14.4038296343842, 14.394511790461651, 14.348367943326428, 14.32853776014437, 14.327587327392449, 14.283804275698357, 14.259508539703859, 14.302287805393696, 14.282305711120337, 14.263298819721763, 14.285400767896524, 14.264218208695306, 14.202014100127334, 14.20328112967117, 14.216620715709263, 14.116703246320014, 14.113002574980353, 14.19797659791998, 14.184475437460227, 14.17140586394928, 14.153367169282923, 14.105488824436396, 13.974118638251884, 13.961962352804841, 13.941713929826346, 13.905724479598716, 14.00303964026138, 13.894208584015068, 13.888198442124644, 13.910217270859699, 13.958348976096786, 13.996486767640276, 13.952433116756215, 13.881485908164867, 13.841327704307004, 14.010233855893194, 13.901290765892576, 13.964782990834575, 13.947668807360214, 14.002108660702943, 14.100236293569111, 13.913514059265415, 14.008878934326711, 14.1215861114549, 14.166863866092848, 14.060411692695627, 14.091507958506499, 14.042020007415392, 13.933502120084123, 13.976718637677976, 14.110112398986368, 13.946827178207108, 13.92074063569153, 13.719143640395481, 13.899877269504755, 14.032231641092489, 13.90552849121535, 14.030796627867813, 14.04078405713417, 13.835538213150517, 13.887683094620403, 13.922253279554539, 14.033362121502554, 14.003644608750475, 13.973479075909129, 13.912907524482925, 14.112683977468198, 14.03643922189136, 13.96315674414098, 13.830193463808813, 14.114193305067333, 14.054674185637106, 13.85320381041386, 14.168994234583005, 13.976630129998245, 14.09168283178549, 14.1360857562945, 13.930594160736613, 13.951043088939633, 13.829115383583336, 13.885756631493077, 14.163375698423827, 13.91575038053925, 13.558089809232264, 13.73735035053235, 13.913573293359047, 14.044695829875689, 13.640779071271522, 
14.018409931371455, 14.228975095827632, 13.996144832956702, 14.189387423270379, 14.226768069678103, 14.174632825996992, 14.164681909355574, 14.183902661242401, 14.218647655424025, 14.427719491219426, 14.120208529383286, 14.106984808719545, 13.908662457927276, 14.473311879038915, 14.238014829218347, 13.934301621528302, 14.102096730568954, 13.909338128391484, 13.942206839197462, 14.181340588754892, 13.948523943371205, 13.972790388999817, 14.242211417447482, 14.420550819515553, 14.252479889698895, 14.383110307644158, 13.773742200312293, 13.743677908920969, 14.123502462283474, 13.900535882002238, 14.227020639667176, 14.06790568544232, 14.145869780275154, 14.19630099932665, 14.526115896114717, 14.30476007895747, 14.278952790980613, 14.094104422770519, 14.282651002326427, 14.55645026567875, 14.425996465486946, 14.247489799175268, 14.577661449301463, 14.171615177964057, 14.138150559959351, 14.140453785817485, 14.217873578980667, 13.851490717186534, 14.603376885590109, 14.067628519597573, 14.569609396603749, 14.421892354101198, 14.18606447086843, 14.610286991797324, 14.222404290019295, 14.177463114690175, 14.772381708813604, 13.945813796751972, 13.536192336089108, 14.28796650731713, 14.080941656546544, 14.22686051830709, 14.227778001967485, 14.038976189344941, 14.145769402674473, 14.459255001471618, 14.264209109526853, 14.330397197895167, 14.650372916133163, 14.001328479806302, 14.02193605062181, 14.39571200321637, 14.86536373425616, 14.081058712797484, 14.835973143990838, 14.509614662034261, 13.785978033174597, 14.218416384987261, 15.059772537225614, 14.329773021409101, 13.455808563243972, 14.033106617897273, 14.01086117134799, 14.16314429879686, 14.647739883711514, 14.79299365361564, 14.171276750577201, 14.434363850302072, 14.395519008657804, 14.756313790148624, 14.53292989993164, 14.314182828990615, 14.464415960302087, 14.558541262859212, 14.449437954637844, 14.502407364769912, 14.656588592503017, 14.45088862052063, 14.09056308805812, 14.236811303181321, 
14.231726122876996, 14.150265936486838, 14.122433833612545, 14.573169122678745, 14.150500898745522, 14.786006868459786, 14.275586977128432, 14.814900767960614, 14.298983081050714, 14.344781106248757, 14.940281956685912, 14.523325722275038, 14.361925854879782, 14.112913799187929, 14.643600688980426, 14.464776383164972, 14.703064310400354, 15.23140965300202, 14.24925415277032, 14.78178791245899, 14.158468551563553, 14.567587404768345, 14.045160228650248, 13.909743120619018, 14.904771788947079, 14.464864882426511, 14.701568280102949, 14.577561494468098, 14.549581586109612, 14.737440257652876, 15.049080570434281, 14.55662423106221, 14.011578440819184, 14.76264855634388, 15.163176883675128, 14.565235974601618, 14.091915332269688, 14.984113362787882, 14.676029094826172, 13.866299020013265, 14.689983680465387, 15.927299248097773, 14.917433254596972, 15.720855488048633, 15.418944787906206, 15.077852489181057, 14.312334973235492, 14.892481053218042, 14.076714562092736, 14.667594103784724, 15.048784123670847, 14.23970744963329, 14.39318449269954, 14.149865168637126, 13.972954122885588, 14.54854949471653, 14.940895335862596, 14.589664474442216, 14.11410654707021, 14.518360453034058, 15.096717055442163, 14.563630876592214, 15.269331276744076, 13.99825449560425, 14.199799941707067, 13.546127917522895, 14.363289466287146, 14.231699150792977, 14.144718620784232, 14.305210556262411, 14.240327214943347, 14.154756737284348, 14.236725999739331, 14.702599363479576, 14.931131307010636, 15.427790341157133, 14.931235045001246, 14.873751170955895, 14.255804970026686, 15.095188481903929, 14.153451168701471, 14.920787699775163, 14.028921996155889, 14.310174761231927, 15.57768454981096, 15.511896692870273, 15.10798687917088, 14.802647056206679, 15.454949178813044, 14.943240344711326, 14.32048149625778, 13.759952988479913, 14.644261901320323, 14.900051419685157, 14.678209426296206, 14.334390706426312, 14.153628773611098, 13.886696529108196, 14.000652872587368, 14.722629671267473],
},
"2022": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [16.573462144306383, 15.596174439863377, 15.234489173440425, 14.864627971004897, 14.647002560958002, 14.51062709463858, 14.40116555801216, 14.349422690109643, 14.281734213027672, 14.231951373725387, 14.197280476283337, 14.214511676417054, 14.202273839595447, 14.171133907480328, 14.1371714953457, 14.13608879907528, 14.124871224800538, 14.112949183925595, 14.053650535986394, 14.079177083693137, 14.036412783305957, 14.073229173001078, 14.047945299518602, 14.070015795369656, 14.025196613416494, 14.048131120574896, 14.027747521755508, 14.04693966880932, 13.989021728447161, 13.944881767368678, 13.886933089138001, 13.850051890871612, 13.856003976208148, 13.815068083718375, 13.837193877844612, 13.784655598298468, 13.842614301186936, 13.77557561009653, 13.77224160885926, 13.776600344846765, 13.826144019908194, 13.763706308109851, 13.717473009263493, 13.696012101124342, 13.794608115038537, 13.776246769386619, 13.734851495838463, 13.771958143359385, 13.726042906984397, 13.668899883848688, 13.757712183702036, 13.704560348339815, 13.783786123200786, 13.83641193388869, 13.868905832331333, 13.849645348448345, 13.95528051598666, 13.95505863029343, 13.839082246875563, 13.838436454468521, 13.915254552296155, 13.762764025908899, 13.688901609741823, 13.696755257291253, 13.778190465746299, 13.816006543875408, 13.82103497206815, 13.779428665282765, 13.754489087454546, 13.811443840881214, 13.770282324096618, 13.737755151636893, 13.718607326900317, 13.719391275894619, 13.689159138793773, 13.915030059440356, 13.640556357365238, 13.784109189921415, 13.898309014346827, 13.635058416855403, 13.682469750031643, 13.784077058586005, 13.614382036248045, 13.675298494725313, 13.668442871322661, 13.721886395110696, 13.789712241738473, 13.572600625198126, 13.673413438815405, 13.743332722827345, 13.722225182656953, 13.681662164837368, 13.626698965726872, 13.628119315894407, 13.442135002676414, 13.496458815371229, 13.89197866538334, 13.641461535501413, 13.879886838673235, 13.857813671327913, 
13.904101718534095, 13.691589314679872, 13.688087764972993, 13.75019330569756, 13.775705815269305, 13.818048957104923, 13.838426569541493, 13.87378344390341, 13.95249789115123, 13.84161364290297, 13.793286673060717, 13.793855375859797, 13.612719779902854, 13.567372345820983, 13.727659226809301, 13.75814093748428, 14.016406773942144, 13.666026498207929, 13.76543524609798, 13.921578363669742, 13.62236868498279, 14.218743767416479, 13.894390824537616, 13.835036107967746, 13.821814354601791, 13.815352044657493, 13.63291347173543, 13.914142076335848, 13.902164591159094, 13.75340398879414, 13.757796232042619, 13.947361314339101, 13.812380150469728, 13.64842644927079, 13.680220428334186, 14.19128594688195, 13.90872163648549, 13.709915874495577, 14.305610405002627, 14.017476771896723, 13.913706939667822, 14.041925551417304, 13.792132210585926, 14.158571611438195, 13.719360968998185, 14.077474378392191, 13.872815383912409, 13.610435935627018, 14.21946622979818, 14.191843568768466, 14.07447374943782, 14.113187584666102, 13.853103994300728, 13.737467173849335, 13.85190476578892, 13.783777206918097, 13.877910972474517, 14.14083721762618, 14.097996519640605, 13.691792923044662, 13.901671052705835, 13.826731782170265, 13.76191264062571, 13.914158935505744, 14.075933365745223, 14.015337137986572, 14.020710391408425, 13.752585714099315, 13.916336207681834, 13.921541427751697, 14.538780447662331, 13.548031644597161, 13.877597908381185, 13.82785734202697, 13.835644605643694, 14.095853895847423, 13.628986120192666, 13.651555792433992, 13.684100113750324, 14.126303911640594, 14.12819638849766, 13.513658817667569, 14.04991026847487, 14.075349509287857, 13.599443864843355, 13.901653490393688, 14.116940866903528, 14.447795487232423, 14.175788401391147, 14.24549480637781, 14.082219655442112, 13.945900149380442, 15.41665075184427, 14.09092252237217, 13.962485170018734, 13.853324684117208, 14.300518130765969, 14.679034583112099, 13.890994648126625, 13.848914731733823, 14.074745430758165, 
13.718497892807623, 13.813432378703823, 13.910230373201061, 15.891460291825394, 13.887027453230893, 14.240677540244254, 13.585805239111629, 14.219845664656985, 14.239986387939556, 14.256542956266319, 14.699671416202978, 13.034803839092152, 14.279526808318353, 14.203618557298823, 13.69942973957017, 14.852775292533702, 14.705781491940945, 14.880769009150814, 14.080929986418516, 13.98987102169266, 14.056776098579787, 14.200551441974767, 13.869018580766827, 14.172346721802862, 13.908701829131722, 14.05200499507018, 14.953861829658582, 14.478959291231744, 14.289266616246826, 14.263612965144183, 14.791179486376187, 14.66588280189917, 14.046588278734843, 14.270444904859211, 9.570273738497933, 13.393022696317052, 14.287273030446956, 14.586197406241359, 14.009519095765436, 13.913104133158772, 14.394982072391072, 13.845052383610941, 14.075398039003069, 13.720279996787793, 15.918307331487394, 13.950845891909333, 14.161031303839323, 14.414017113143304, 14.07798698493535, 14.028232685065156, 14.066164268512528, 14.122640702208512, 14.719223348813339, 14.089698444360401, 14.923133171863139, 14.027925447322207, 14.859904976591874, 13.828780032157383, 13.758394371554884, 14.212745217830802, 14.639594923560438, 13.313976437659116, 15.051782211486312, 13.466939926396423, 14.13584577145757, 13.997907138236089, 13.437786071216715, 14.143550112604196, 15.013518092830632, 14.310159900374993, 14.24309503024266, 14.882471681533945, 14.754081514779902, 13.952630289830978, 14.356518350098636, 13.841076292748065, 13.17557406572946, 13.843300304809517, 15.534713921188569, 13.489501667105461, 15.323003263489925, 14.405831914476117, 14.260543641985588, 14.23381356656912, 14.062976691107115, 14.71037740234297, 13.652258277537488, 14.414142143046723, 14.012733020591691, 13.738429608775572, 13.795105640310114, 16.905541410998413, 14.363532045313905, 14.340997597817381, 12.644035012321227, 14.210848531614518, 14.655835827595727, 14.359502747186784, 14.124354988618265],
},
"2023": {
"x": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300],
"y": [15.4293630385597, 14.827776633211421, 14.600432832118155, 14.43330043760322, 14.30586483681026, 14.203397641081045, 14.140361413924607, 14.101673126860582, 14.05840021694595, 14.033693337279875, 13.990003714671388, 14.001106927608756, 13.982387676044238, 13.960424890216352, 13.941694305252629, 13.928958405693843, 13.922871327026984, 13.90749356497257, 13.883187320364065, 13.870538613453949, 13.853682922141118, 13.839326154723096, 13.841949693311191, 13.851284862386178, 13.853606323578846, 13.851840301257587, 13.86166226046842, 13.872513892742713, 13.867295530090015, 13.870385212514083, 13.868578068850889, 13.848685425568009, 13.838736750620761, 13.825182992628129, 13.795340100698754, 13.809629502148145, 13.767911089744738, 13.75599639262174, 13.75925151191706, 13.751975433642748, 13.731931931502134, 13.714316407794309, 13.730848265421725, 13.681606796845, 13.670846152397202, 13.685040324991581, 13.687292733648798, 13.645627677729081, 13.635021438002346, 13.670103747374988, 13.62246956240464, 13.658574692934657, 13.65219324836813, 13.663836335892329, 13.666948307267594, 13.642643510414398, 13.672961601819406, 13.663525877548398, 13.667436573958156, 13.687522639036205, 13.647544546546508, 13.670704172336292, 13.643000490240736, 13.667107110344569, 13.660218070172265, 13.675550822990397, 13.59092599672469, 13.619850375757148, 13.651551988902462, 13.684288098100867, 13.599046453546292, 13.580905963181452, 13.620956017533885, 13.648408527460056, 13.60249514150298, 13.568078301644128, 13.6145797181229, 13.647719674647586, 13.531493703586886, 13.609260600121146, 13.687447710013837, 13.602215210547463, 13.563220813507392, 13.57176728376717, 13.664222431811334, 13.586259696651297, 13.571127927324502, 13.692682818016978, 13.599437831977406, 13.646024625160337, 13.645231022004468, 13.582760709524955, 13.597408008025921, 13.640791164279545, 13.58016693386471, 13.664139165839629, 13.553901320176095, 13.616471379535914, 13.574418885444663, 13.62049913139043, 
13.595296717779055, 13.618520397945241, 13.619083853308746, 13.549404239296155, 13.515187660214737, 13.728226318739061, 13.618609127026419, 13.638021829042664, 13.684199453984574, 13.707676555543845, 13.541617144639595, 13.703834138276244, 13.519323579997998, 13.6031555746482, 13.56414632339735, 13.711610914557605, 13.529701508251849, 13.631734977501925, 13.657120297408555, 13.58489249685537, 13.64403630157245, 13.608235747585796, 13.512110498832085, 13.846959297419959, 13.488917791046676, 13.696834245583917, 13.61507766454769, 13.565377802829648, 13.790197786574588, 13.564346823139237, 13.5342157764538, 13.65148446769962, 13.570646849759997, 13.538878864721305, 13.608980817839505, 13.664477237928127, 13.532411719398455, 13.737437273256564, 13.519816331488395, 13.764368990604515, 13.653588472445573, 13.5302540795639, 13.57561188810073, 13.647608383912683, 13.728643890026184, 13.710097008284352, 13.75589344505474, 13.682502650080487, 13.684339202206958, 13.86749342599449, 13.645786331176726, 13.660817039716257, 13.638011389586667, 13.732387353692099, 13.687686391049773, 13.94728981311995, 13.614547412507926, 13.460552695752389, 13.857074456574574, 13.660326212827487, 13.718393121459215, 13.76973846040823, 13.778762864123724, 13.656959991670522, 14.214462072816556, 13.622739420457773, 13.645227120727897, 13.687497326712435, 13.649272554141808, 13.503550000252996, 14.052494437028535, 13.580311058963396, 14.14017314736784, 13.64182000911326, 13.886936632170794, 13.942674178813384, 13.801754161915504, 13.931144818346747, 13.584651322907064, 13.960391830857033, 14.178873989248789, 13.645923431288137, 13.97423140921055, 13.669569353257327, 13.915331700422486, 13.827145087821776, 13.736836827537942, 13.74766543270326, 13.770318536193258, 13.721033560006754, 13.710191655241298, 13.72744974500201, 13.845900599098753, 13.678446729208007, 13.902643304888189, 13.885717101405227, 13.800092557910519, 13.421930828385424, 14.22006344809192, 13.879986040380091, 14.134020605148754, 
13.828712030750555, 13.713190050100788, 13.670401789346878, 13.948423234333882, 13.84481181587886, 13.818908981670926, 13.74582730003707, 13.94097096205736, 14.180988587482524, 13.792218775776533, 13.684855627228844, 13.881739174231223, 13.998746647008945, 14.576445279868192, 13.977974630190932, 13.537548783758675, 13.793279757360363, 13.712674433009878, 13.758696209000801, 13.912382937440464, 14.340144810498328, 14.03279240397904, 13.889996587251982, 13.862065986515601, 13.712302898403514, 13.797613183843772, 13.847295441275936, 14.422108283887903, 13.900169262027397, 14.247783256416513, 14.02056653491548, 13.99526374998638, 13.69358071050138, 13.828640744267325, 14.01321596237364, 13.824657271537166, 13.683602248925892, 13.933987455146445, 13.993921243916123, 13.720966315955001, 13.890770809341586, 13.426961283787957, 13.789886238259456, 13.904131224083592, 13.697354217113691, 13.710497864728065, 14.683006531539148, 14.315759264484964, 14.034699751802846, 13.890948305458895, 14.038907287423818, 13.298757873288494, 14.037824844116592, 14.162250808384407, 13.947058195824253, 13.806653590867487, 13.980386450979841, 13.667273172120268, 14.201737731565034, 14.447849496372461, 14.018697147254176, 14.002315381014313, 14.15231239942244, 13.73719042552595, 14.033594655653038, 14.03087108296539, 13.782578520604822, 13.660908086958573, 14.205910336717215, 13.930322566343703, 14.300591211697906, 13.808749910964323, 13.8076208806989, 14.169819824542373, 14.067537576689853, 14.306124453553517, 13.56827905088618, 13.592634469105525, 13.789396713937975, 13.853464456609156, 13.855768885291056, 13.710464058237172, 13.641314331273772, 14.295528532894258, 14.04977108393012, 14.153384726345907, 13.385524853965638, 13.484650040422745, 13.831061312642468, 14.15298734516191, 14.20289531849528, 14.116529526532855, 13.767652893233096, 13.715924776449405, 14.649027392365024, 13.603310028324861, 14.10228343978809, 13.704762155010586, 13.731715455443299],
},
}
# Graph 3: draw every entry of `data` as its own line+marker trace.
# Each entry is read through its 'x' and 'y' keys; the legend label is
# "Year <key>".
fig33 = go.Figure()
fig33.add_traces([
    go.Scatter(
        x=series['x'],
        y=series['y'],
        name=f"Year {label}",
        mode='lines+markers',
        line_shape='linear',
    )
    for label, series in data.items()
])

# Plot, axis and legend titles, plus the hover mode, applied in one call.
fig33.update_layout(**{
    "title": "Perplexity vs. Number of Duplicate Documents Over Years",
    "xaxis_title": "Number of Duplicate Documents",
    "yaxis_title": "Average Perplexity",
    "legend_title": "Year",
    "hovermode": "x unified",
})

# Name under which the finished figure is kept.
graph3 = fig33
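## Graph 4: average perplexity vs. dump duplication count, keyed by year
# Data: key -> [x values (dump duplication counts), y values (average perplexity)]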
data = {
"2014": [[1, 2, 3, 4, 5, 6, 7], [16.82572561037536, 15.568688184472002, 15.81492345088457, 15.206355227978303, 14.957766124315622, 15.0626618458479, 14.868694970954875]],
"2015": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14], [16.89591942700286, 16.065453332424525, 16.27127382267357, 15.98729389349345, 15.820859416672139, 15.607600911192797, 15.110138119917048, 14.775887397593593, 14.660655022362318, 14.588547400309, 14.55020529201701, 14.60127048285861, 14.629467286160864, 14.724440862889]],
"2016": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23], [16.937063110995666, 16.159401045667217, 16.24178377816029, 16.073494730595225, 15.774737597940442, 15.621947075605162, 15.652955728810767, 15.490807185265608, 15.107547930881259, 14.976802818244652, 14.84517846815987, 14.839768640933237, 14.794471716989547, 14.63826024444852, 14.57725826735028, 14.446983381957654, 14.357863327746747, 14.370146480850329, 14.207796791759758, 14.067617540013867, 13.968037234662484, 14.015386030957798, 14.240341030736081]],
"2017": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34], [16.731010662045737, 16.534529481773635, 16.624818021435388, 16.6027968727952, 16.309053610063657, 15.897351021398148, 15.28125612085656, 15.247650153402024, 15.254523671401472, 14.914419299947483, 14.734687782223004, 14.78413990847839, 14.632065773173599, 14.553246204352645, 14.566566717229817, 14.598997883895558, 14.630837564582592, 14.577208610859856, 14.519413074334954, 14.378498447103155, 14.230943065441672, 14.21486380216727, 14.267422050116286, 14.281606945252474, 14.285535565035358, 14.267266452303197, 14.183136371592417, 14.148268300539986, 14.21036055571916, 14.403658436211263, 14.07740471177247, 13.978242496152737, 14.002633023111342, 13.921442192327655]],
"2018": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46], [16.36546565307699, 16.40198820766892, 16.223802437472045, 15.876190858008776, 15.67866795074444, 15.06202559354935, 14.90395971116697, 14.678203166785968, 14.584307457124408, 14.566603376547835, 14.716527825876883, 15.325114798824192, 15.153635738494962, 15.02749650458142, 15.001501640976104, 14.928437622685198, 14.82066263298361, 14.821925418558614, 14.766538823073754, 14.742836908980854, 14.56365471694568, 14.676889493065413, 14.554327268897188, 14.532997117657752, 14.424665661602356, 14.498427111442304, 14.503622356394782, 14.465294436509943, 14.238209588803269, 14.138531026657803, 14.11633073136879, 14.139167312709546, 14.018054330979824, 13.99555243574117, 13.944770385859002, 13.893353445566834, 14.062344563726617, 13.93602183204734, 14.021518977400955, 14.205273479299835, 14.476114932821364, 14.707612238290547, 14.403724822460271, 14.134464626849528, 14.444143421676507, 14.372513155481114]],
"2019": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58], [16.430122616908218, 16.959894024725404, 17.530494343918114, 16.868158683774006, 15.881925908038214, 15.534071764082064, 15.131599277920825, 14.912091189771328, 14.670101527122705, 14.591504400695127, 14.405999306200146, 14.445437111619501, 14.460150974610382, 14.484377024024335, 14.454923933668082, 14.419367200283267, 14.413528998792588, 14.362242243379736, 14.326113076490996, 14.296366861932851, 14.241137636937816, 14.199018730937293, 14.229939247452181, 14.136900232594229, 14.118747592622253, 14.084639441555339, 14.215359965064522, 14.321335291582407, 14.324483466296755, 14.22250351319463, 14.086153725088337, 13.835546707594524, 13.861133395338289, 13.943395906095482, 13.924621051048792, 13.978711084778347, 13.905837106100599, 13.895058375110484, 13.965442215811176, 13.960110799963521, 13.99641930380663, 14.036529641608142, 14.138294825947872, 14.3360579115842, 14.381214824082278, 14.389155929858507, 14.645175007732961, 14.477402464547152, 14.51444505845359, 14.452153618691407, 14.369430039316658, 14.777857326947053, 14.919588044831785, 14.44053007434645, 15.18596756335163, 15.362545102466955, 14.19095014510728, 14.974116009038374]],
"2020": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67], [16.370879996210345, 15.8912555858172, 15.30157381561316, 15.461362783916728, 15.499602726814674, 15.329200065422526, 15.15238010628145, 14.763158730707703, 14.554444724050978, 14.391542531017906, 14.36062417910266, 14.38408773153761, 14.326398992080678, 14.30559398460406, 14.296620966953196, 14.257641523080219, 14.239785079623704, 14.257963344315925, 14.242187947481078, 14.227247960684823, 14.246528806504662, 14.218691858857001, 14.119027315863725, 14.16049126937658, 14.1393355330565, 14.045446781499932, 14.157717833319223, 14.118844952908322, 14.196031529646438, 14.213151244097208, 13.961708881578405, 13.933434907040512, 13.851967361230258, 13.837032186918211, 13.83609308408103, 13.74084041793037, 13.725470779946555, 13.828238575588477, 13.821753201986834, 13.81152543072784, 13.848104780631868, 13.867032605563987, 13.91567734841802, 13.951714207206178, 14.049401288158215, 14.000020142532282, 14.097054408814992, 13.973915015915077, 14.001305792897133, 14.144447551433583, 14.259794771973013, 14.451580305620148, 14.51523695971965, 14.491781843544896, 14.282130970472108, 15.107471010795585, 14.507809743534436, 14.521069179252333, 14.434674191986367, 14.608533166251355, 14.638444470251414, 14.533496524040576, 14.798278071146985, 14.426231926251468, 14.697215649677831, 16.000970311873413, 15.962112261396376]],
"2021": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76], [16.40998076014569, 16.214064988829055, 16.102423371338, 15.61960664445389, 15.365806380257993, 15.258505702187641, 14.987691202287733, 14.702934989974425, 14.47618699872759, 14.27294780183996, 14.149902488372312, 14.205153888507418, 14.180406523176302, 14.179162306409303, 14.148172641684653, 14.146789562089962, 14.13207546325995, 14.095045629570848, 14.11059784727951, 14.099774964675055, 14.123404475264994, 14.04205645064162, 14.071957340879374, 14.076002230293538, 13.997579723886533, 14.055982816834012, 13.969566421026498, 14.044197137615983, 13.970800321234117, 13.991254850488748, 13.882773884993162, 13.878676595695538, 13.738534890032913, 13.731264526843741, 13.743931319054433, 13.744385448034985, 13.654269807446708, 13.649793785589242, 13.659669286701138, 13.70981039304929, 13.706017327034093, 13.793638036031938, 13.820253019972634, 13.895844222751752, 13.805532005211788, 13.879969410141696, 13.918667434527839, 13.905080860878972, 13.928649229766597, 13.92971106121914, 14.027211058825408, 13.869387194129342, 14.002439547556614, 14.197189244986761, 14.171599593405029, 14.189026952927275, 14.317088413682809, 14.266884102594418, 14.419819049388389, 14.394102801112203, 14.28486572885178, 14.463889605992794, 14.33813105749612, 14.49991185507524, 14.143521529230846, 14.020378845184027, 13.929518285869944, 14.785566241242854, 14.273112202537183, 14.214773231874327, 15.148250280334482, 14.563912283938823, 14.552655401047055, 15.103655560583926, 15.10169368308145, 15.51226670578053]],
"2022": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82], [15.816438075969113, 16.09580666529207, 15.996333190110686, 15.943848815283268, 15.656093894572393, 15.117394092950262, 14.78287160043243, 14.543141634926663, 14.305058018637094, 14.125611753367533, 14.020067247129745, 14.009478965058692, 14.001669618595649, 13.985248005578073, 13.973728782674742, 13.977117237954532, 13.937202607945661, 13.935625722728988, 13.910945770197134, 13.893835251097759, 13.89679037463924, 13.881064193374637, 13.904299030382344, 13.904090626213797, 13.888526913768459, 13.838568567514612, 13.829178463025315, 13.835043064902585, 13.81757570730985, 13.776370281729609, 13.762638676519028, 13.755074572847866, 13.70045870380896, 13.636805800875507, 13.621671132216942, 13.633589926779942, 13.602080944483301, 13.555848610415586, 13.558904660155596, 13.515784046498322, 13.609062507319349, 13.583137427458137, 13.483909540769114, 13.552547586090368, 13.598431457952788, 13.553603210491028, 13.57678073518515, 13.638974685844074, 13.536340332636364, 13.665029112653803, 13.792584632059397, 13.694618901117751, 13.76826442085512, 13.712141215124436, 13.606927085734855, 13.715251358141709, 13.832372298562165, 13.833057817510603, 14.158282794215733, 13.720855464980609, 13.803417413649743, 13.969854384335488, 13.892171370159991, 13.778269401162506, 14.338216122354686, 13.954993084366778, 14.124621205791534, 14.23737489353975, 13.735373769168353, 14.680642990647039, 14.955805632680471, 14.657580957949671, 14.515390831490835, 14.664661248141265, 14.497750142907295, 14.662641057721332, 14.889760996859867, 14.044358215057608, 14.201835355776206, 15.739648390380614, 16.209835613545337, 16.152241961523004]],
"2023": [[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87], [14.789164834058647, 14.816940361326127, 14.859128791010018, 14.874353138456074, 14.799558338831533, 14.521955875294703, 14.344439116861626, 14.188768591243738, 14.068214649484007, 13.975247139727212, 13.892361806680233, 13.873812682757855, 13.855623423924795, 13.834034581531931, 13.820704041290954, 13.809345726828388, 13.799809305012891, 13.783733425983497, 13.777650159371621, 13.769295261894937, 13.759922637457876, 13.763157283741176, 13.746892077566258, 13.76043892787152, 13.780799936451544, 13.769219249583701, 13.776107653632701, 13.791395904208231, 13.796017873163873, 13.793511195440795, 13.752832872061946, 13.744140909741626, 13.708291014183953, 13.71791539682566, 13.687888739966342, 13.639779981608498, 13.60820604942688, 13.647619221630219, 13.586732110007599, 13.578824230397977, 13.56286775189147, 13.54887132723798, 13.528005768240323, 13.562278263274335, 13.50423334091739, 13.534814940452101, 13.500524731734556, 13.50415611423685, 13.539792624454682, 13.524280636462276, 13.508635254011224, 13.559898859515048, 13.52340866000508, 13.580987242413414, 13.55406078682323, 13.51949982056399, 13.554946096777044, 13.582384634669271, 13.596405485832927, 13.56397157046417, 13.50076890156882, 13.5996552161972, 13.640177272640555, 13.488306430506505, 13.561144538501607, 13.538229936728902, 13.523274401746107, 13.549803559768709, 13.473822808409837, 13.604196078834873, 13.495970010370977, 13.511897788189435, 13.480753572940852, 13.790758773339501, 13.507154643917646, 13.451282820788672, 13.690887252346345, 13.752272760476266, 13.844969190718858, 13.547043033265561, 14.011397551896307, 13.686917203544905, 13.87527368747695, 
13.86828531076653, 14.200910595590095, 14.228639023300655, 14.830844952562549]],
}
# Build graph 4: one line+marker trace per key of `data`.
fig = go.Figure()
for label, series in data.items():
    # series[0] holds the dump duplication counts (x axis),
    # series[1] the matching average perplexities (y axis).
    dup_counts, avg_perplexity = series[0], series[1]
    trace = go.Scatter(
        x=dup_counts,
        y=avg_perplexity,
        name=label,
        mode='lines+markers',
    )
    fig.add_trace(trace)

# Plot, axis and legend titles.
fig.update_layout(**{
    "title": "Perplexity Across Different Dump Duplication Counts",
    "xaxis_title": "Number of Dumps Duplication",
    "yaxis_title": "Average Perplexity",
    "legend_title": "Year",
})

# Keep the finished figure under its own name.
graph4 = fig
# Graph 5: average perplexity per duplicate-count bucket.
# Data: key -> [bucket labels (x axis), average perplexities (y axis)].
data = {
    "2014": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.993513389984585, 14.011578085529056, 13.85873136108517, 14.36377987125267, 15.699475274542996, 17.613998844460845]],
    "2015": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.471687658163091, 13.778144432139904, 14.021706888859466, 14.434268636964038, 15.738483406741972, 17.840661656870072]],
    "2016": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.438546004899326, 13.785269267918505, 14.181493168285378, 14.616607805125264, 16.2678738383595, 18.109357061988614]],
    "2017": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.567324655164636, 13.93914285288248, 14.443292405833132, 14.749691886458645, 17.212768319133406, 18.09921482533539]],
    "2018": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.79413309579284, 14.047920703385312, 14.732393204862687, 15.245556746489475, 17.523092460922793, 17.979494192145445]],
    "2019": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.755894620552562, 14.061328527771183, 14.921709511248036, 15.746644701243795, 17.6501867538675, 18.65346532837317]],
    "2020": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.808975955128705, 14.075864850752456, 14.857958945409392, 15.491042607097183, 17.423084409503307, 17.519155049505677]],
    "2021": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.97373049489925, 14.044277002343486, 14.943719820749207, 15.730257843247038, 17.289265921502192, 17.00252056705296]],
    "2022": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.865869368871065, 14.028544413850119, 14.920117888974543, 15.693608290158098, 17.33525765189499, 17.724085896005107]],
    "2023": [["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"], [14.499660832882716, 13.98118612654411, 14.86417535071986, 15.440738449977292, 16.94447963146979, 16.40768745134217]]
}

# One line+marker trace per key: element 0 of each entry is the list of
# bucket labels, element 1 the list of average perplexities.
fig = go.Figure()
fig.add_traces([
    go.Scatter(
        x=series[0],
        y=series[1],
        name=label,
        mode='lines+markers',
    )
    for label, series in data.items()
])

# Plot, axis and legend titles.
fig.update_layout(**{
    "title": "Perplexity Across Different Buckets",
    "xaxis_title": "Bucket (Duplicate Count Range)",
    "yaxis_title": "Average Perplexity",
    "legend_title": "Year",
})

# Keep the finished figure under its own name.
graph5 = fig
#graph 6
import plotly.graph_objects as go
# Data
data = {
"2014": {
"x": list(range(1, 88)),
"y": [16.82572561037536, 15.5729544573954, 15.76916326514348, 15.186302038671778, 14.936809838870326,
15.001743417469209, 14.864349796797914, 14.66090559477578, 14.50521188055062, 14.429989457983405,
14.44107090883399, 14.523867649934015, 14.515728033558386, 14.52893012438083, 14.3872701582485,
14.225935934612775, 14.161270385625249, 14.193552536884559, 14.107559093534066, 14.045872060793387,
13.98606116940174, 13.996535021107574, 14.068451357323962, 14.095424742580935, 14.104930415857556,
14.164512298046297, 14.205441475464172, 14.190478352923273, 14.080583365838212, 14.017757335246573,
13.914391577020234, 13.860680803527211, 13.709718483172745, 13.671102868173037, 13.641967377585344,
13.610477152664181, 13.589404166531697, 13.574364349432603, 13.588675304139612, 13.608431855502594,
13.602022539289871, 13.577550630742646, 13.5388901112764, 13.586266218232485, 13.543364159175262,
13.530598188250648, 13.5415846166861, 13.518331785106323, 13.533012163841759, 13.505063315507076,
13.546433152010087, 13.571041150558058, 13.538517630502037, 13.589716598763259, 13.542375131110317,
13.551229472032986, 13.577615792486487, 13.580265758570304, 13.611791663131656, 13.563252675321158,
13.496554744217198, 13.573611486889268, 13.619417346323402, 13.500110681053787, 13.606494277444822,
13.51758492586705, 13.509290876196683, 13.637653184648098, 13.453927168439604, 13.677712744726351,
13.586150504785195, 13.508649309624724, 13.427111951862848, 13.800940000499685, 13.540635679680195,
13.506572883300588, 13.723957125925423, 13.69941910754067, 13.830916622405972, 13.61477646698581,
14.050670659742897, 13.707871486489617, 13.879222794014064, 13.838270894748867, 14.189041030733511,
14.221410654489386, 14.830844952562549]
},
"2015": {
"x": list(range(1, 88)),
"y": [16.89591942700286, 15.993069023056673, 16.243349252734195, 16.110419584106467, 15.982982023217136,
15.780412452462956, 15.311492684065183, 14.985452841100962, 14.736003632647204, 14.643740634573437,
14.581818722981641, 14.61206887509358, 14.60310477647637, 14.58283877743656, 14.456739625003323,
14.371166857791525, 14.31983561927552, 14.324744175103753, 14.230377570291408, 14.172400195643684,
14.074979303784101, 14.06637978929149, 14.129765267158923, 14.144182701579643, 14.127393749297303,
14.170954937339665, 14.198905272060887, 14.177619224859075, 14.073073703918407, 14.014468948454157,
13.91281662387792, 13.866047771993978, 13.718029097387152, 13.680243640703553, 13.648583428855366,
13.620824659009545, 13.599252706541842, 13.582576892167687, 13.59570512552313, 13.620006512175056,
13.61371460828329, 13.58747315850088, 13.553159834309662, 13.595855683037627, 13.555194351409998,
13.545131292437988, 13.55533031134806, 13.53176578053929, 13.545627399503374, 13.52324264159441,
13.56019390924936, 13.584765148382376, 13.567436274268637, 13.613633832001781, 13.56834903785532,
13.564886395063189, 13.585588042180726, 13.59211972866627, 13.636661940057897, 13.583630103422175,
13.517621040928827, 13.621723155241801, 13.644527863238189, 13.52150990576411, 13.63020958334669,
13.54428783928786, 13.53725206048877, 13.647484409192606, 13.490519893023992, 13.683557383784123,
13.623112173204985, 13.558759376238477, 13.498783050518579, 13.848023903419993, 13.565373956282203,
13.524041036650617, 13.747948319462374, 13.741843984167335, 13.851135619804712, 13.592769333513887,
14.059753132138649, 13.714031759165366, 13.87123035917049, 13.863386012094978, 14.205561271109257,
14.22054632648026, 14.830844952562549]
},
"2016": {
"x": list(range(1, 88)),
"y": [16.937063110995666, 16.13008897039131, 16.461262248281052, 16.22524701869722, 16.07512945589454, 15.81169518738005, 15.401255747943388, 15.290536877276061, 15.189318784104037, 14.892680148096144, 14.874941231589043, 15.197590171491255, 14.874108876718813, 14.772934695761471, 14.717224961147101, 14.579633089306332, 14.50655782645537, 14.435927961362305, 14.348044387963261, 14.266921166623963, 14.175146176030633, 14.155440421923364, 14.193605317227636, 14.198019720781069, 14.163648287310021, 14.204946332399512, 14.22475496545738, 14.204790263028082, 14.093780256147781, 14.034401436018054, 13.932675009733511, 13.882052276281941, 13.74135284070189, 13.70495830877455, 13.67945861250605, 13.646286996486673, 13.62871684949669, 13.617194154766194, 13.625737566495989, 13.647397208854517, 13.644435990272989, 13.61908161116556, 13.579719730143186, 13.62432154955091, 13.586802920088218, 13.575059311720242, 13.583160915709527, 13.560181345211744, 13.568315314106055, 13.572213203030019, 13.592269857254504, 13.615523084934742, 13.59675061839986, 13.652762841246345, 13.605972800137922, 13.599797687151108, 13.61588443406148, 13.635017100727426, 13.67797680326676, 13.61550407767841, 13.549525029810649, 13.646426348264216, 13.685855644417883, 13.557730732623456, 13.654494917893674, 13.598966492740331, 13.596850824269557, 13.67606211623268, 13.531829321066132, 13.736041595486006, 13.66155540112554, 13.622341728732476, 13.576672515819212, 13.865689693447742, 13.593823653503895, 13.549026603238106, 13.757031791888123, 13.764537976595522, 13.887154797262793, 13.612757682949674, 14.062295065487943, 13.702773103249053, 13.887824206090368, 13.868971352456365, 14.206954791830077, 14.23126212995893, 14.830844952562549],
},
"2017": {
"x": list(range(1, 88)),
"y": [16.731010662045737, 16.66489684871436, 16.568296606954515, 16.437855314705402, 15.977926296110395, 15.325063337637374, 14.928282696800443, 14.738959466164316, 14.615199372327732, 14.491701731769748, 14.38837234689295, 14.579509085357541, 14.486096782010588, 14.386514742964506, 14.328783257345318, 14.247944995447972, 14.19065895107961, 14.17354382678591, 14.151039883117742, 14.102188877847754, 14.076004337973803, 14.044354444990084, 14.021645356806046, 14.030621721602873, 14.020477810045843, 14.031701258052667, 14.04171400712978, 14.043074023094446, 13.995387210524175, 13.989640260692584, 13.926046401793304, 13.898066232753337, 13.796470656270547, 13.780012350603617, 13.751151287426516, 13.721059118625764, 13.704432047525122, 13.69302750426319, 13.691196863860615, 13.720022791468368, 13.713297481354758, 13.673499420782665, 13.640347860637759, 13.689388371843485, 13.642074890212623, 13.641953443289871, 13.639384501232673, 13.60468612819505, 13.615030447011026, 13.622517997479935, 13.636776517056651, 13.646713543499644, 13.642553869063399, 13.670086160771016, 13.629072087229995, 13.644023633211804, 13.662921343294622, 13.663979848619121, 13.72041962705924, 13.653883587863746, 13.598487708047587, 13.679216506372514, 13.729500926935524, 13.59184630155257, 13.670119193506638, 13.606578039356629, 13.58912160797548, 13.662329284657567, 13.534494438724048, 13.673846450840824, 13.63996498360781, 13.62694917771645, 13.569375400530905, 13.86109411358942, 13.573009950696505, 13.521398904176095, 13.737765136250907, 13.73947064730135, 13.851957566097216, 13.591944403455463, 14.047275913134344, 13.706497861963147, 13.8752419700006, 13.852410962776265, 14.207173465915606, 14.225732066062445, 14.830844952562549],
},
"2018": {
"x": list(range(1, 88)),
"y": [16.36546565307699, 16.45401827941957, 16.3552192563823, 16.073789764186234, 15.71971918795885, 15.261114192297178, 14.951234486665056, 14.689367076535861, 14.518128318670973, 14.390099476525092, 14.259121880707934, 14.322341013577667, 14.269149775349785, 14.22657504335791, 14.17831063712821, 14.129362751026134, 14.091233660298563, 14.065699851355896, 14.045897986269743, 14.009922933506038, 14.008946008943926, 13.986948087868985, 13.96676299568112, 13.974589147811011, 13.981182540647008, 13.988178680995725, 14.022037638217835, 14.067236496270958, 14.02773875655739, 14.008012013219155, 13.96047327707988, 13.941545910212922, 13.874283503971592, 13.872319571354534, 13.848819496944696, 13.818989807687052, 13.795278583261243, 13.805582941066566, 13.77608884517368, 13.808300541084458, 13.801215406173135, 13.77460925841957, 13.749962347541663, 13.788585819175475, 13.738353323889454, 13.748267848539136, 13.743909070082335, 13.70094253905992, 13.695566142077064, 13.715120021384273, 13.717879111446795, 13.729262136679193, 13.722322759559463, 13.741817617080867, 13.695797507509411, 13.7303223115229, 13.721142524694981, 13.731183807899438, 13.774251666658795, 13.703270226348065, 13.650013779539329, 13.737063911330598, 13.771299601507252, 13.61035413656345, 13.692911759706188, 13.645478213049078, 13.632427440948039, 13.685353855181187, 13.536951397436473, 13.722996576069109, 13.684668668827719, 13.654991978676541, 13.571293959475197, 13.901327051067131, 13.590409846183357, 13.555280671785631, 13.801358266402337, 13.759891436212222, 13.877447278904341, 13.601070277589484, 14.053793686670241, 13.74239252938787, 13.856380061979658, 13.86653563573893, 14.207967017152274, 14.2295264543635, 14.830844952562549],
},
"2019": {
"x": list(range(1, 88)),
"y": [16.430122616908218, 16.875051086326838, 17.248145032061572, 16.40581365808372, 15.774430714575988, 15.432767149001718, 15.145763219926579, 14.799558762994192, 14.497109888060386, 14.314004689580893, 14.165230875628717, 14.132599998200735, 14.112646717547443, 14.08981745552461, 14.071275351524006, 14.055953745980803, 14.036895611705631, 14.010822458772108, 13.994688510028434, 13.981568297524671, 13.973131490690857, 13.960851307613188, 13.950407299676206, 13.957766631077842, 13.963923860192619, 13.94968503524683, 13.95489134897448, 13.977622152992309, 13.976393846039631, 13.993956516762394, 13.953670292574621, 13.955101324894523, 13.921696126960061, 13.922513268517232, 13.904228567859588, 13.878944392338122, 13.836936389689685, 13.858488953034747, 13.826255387319108, 13.821733497321453, 13.810924551284534, 13.788436757401502, 13.768651883781944, 13.803381095808694, 13.749861429185598, 13.766023951467982, 13.755033569040371, 13.733275547786105, 13.72346431637034, 13.742887974648536, 13.737327971523658, 13.755247742270127, 13.742754785888708, 13.774345891745789, 13.728724104358966, 13.745302135799491, 13.734638471314582, 13.7609514564792, 13.779567132297817, 13.70364460650017, 13.66329614928825, 13.77103900712268, 13.794109949823657, 13.621080526861675, 13.685285026135551, 13.645675824035878, 13.640254544445797, 13.696632265084162, 13.557089062423215, 13.72744068935533, 13.685312250371716, 13.691487365024885, 13.609612243178898, 13.871590990738959, 13.602896495117179, 13.545298074232608, 13.754105324744064, 13.784568829720575, 13.848250131622855, 13.601751414645124, 13.999031818997702, 13.692806805453536, 13.82245603247244, 13.856124808569652, 14.187925457414872, 14.223944149123374, 14.830844952562549],
},
"2020": {
"x": list(range(1, 88)),
"y": [16.370879996210345, 15.889055037950405, 15.432190412594073, 15.505691782112706, 15.423788890368417, 15.240064903157505, 15.043391085766707, 14.761714938396674, 14.47962007552951, 14.234133021817758, 14.123336425923434, 14.080419066871459, 14.063393745363433, 14.051331002053393, 14.037897577554489, 14.041538161067855, 14.0145622985008, 13.995935362579743, 13.991791105247946, 13.983842732394558, 13.977020615720546, 13.966291155429351, 13.953143025987027, 13.969577694685832, 13.972274556692618, 13.967416689282992, 13.962867288546066, 13.983570820646507, 13.983105305183239, 14.007290834079699, 13.960017748248399, 13.97014807600787, 13.939131974855112, 13.931242142373641, 13.923784747364268, 13.884450633737517, 13.857702881178751, 13.86969533995838, 13.829427121984313, 13.834994065394055, 13.821808671828476, 13.790151002027123, 13.76907986225701, 13.797444154897008, 13.749256987787135, 13.766070221096518, 13.759434645334379, 13.731706353193822, 13.733304557490518, 13.740468199068971, 13.721036580994003, 13.756529386584269, 13.732150648873972, 13.763427764616013, 13.73375582951499, 13.719098308155836, 13.749579407257558, 13.79960240262951, 13.827660100575278, 13.713867309731741, 13.67110069190749, 13.813210464397173, 13.820210906230622, 13.646742569819427, 13.707821135028649, 13.694993324955234, 13.667868455414132, 13.744045961641467, 13.60673607296966, 13.735891876117867, 13.708771958501817, 13.68966975607113, 13.632689223663043, 13.935886970943438, 13.636130655693483, 13.612174548563797, 13.772534936472159, 13.807161877232101, 13.85457230058511, 13.663896751660037, 14.090271528268559, 13.73950346577504, 13.889399028025398, 13.875344815512134, 14.21697484183684, 14.23511142666353, 14.830844952562549],
},
"2021": {
"x": list(range(1, 88)),
"y": [16.40998076014569, 16.131563389687667, 15.926483480935136, 15.698720075567504, 15.493215409831992, 15.18004517433272, 14.889295559356292, 14.61434191320944, 14.373082577547928, 14.186230894539502, 14.090058332837668, 14.023657754832897, 14.007435410828263, 13.98510741208859, 13.970141824822582, 13.969314479688267, 13.946015227855732, 13.928771902280433, 13.918094740825536, 13.904271041635251, 13.898094980435907, 13.884683163944276, 13.877957828236978, 13.901423741421022, 13.906131144086045, 13.902626593900637, 13.894640462593705, 13.918502460807465, 13.918292173412722, 13.936267540996683, 13.893769797887094, 13.89937529564544, 13.863770002450618, 13.867997609697417, 13.848933342732614, 13.815022252718682, 13.791564536076104, 13.785299092567266, 13.757852960538305, 13.756401654592215, 13.759718968653816, 13.733437497507486, 13.700263326582155, 13.741373305941403, 13.675414218993899, 13.706510616734628, 13.679167854117077, 13.691416726739856, 13.672658642514545, 13.70674777789251, 13.677889859468195, 13.696385833947582, 13.676118387776745, 13.712359839755743, 13.678461938862087, 13.655240869170136, 13.686341276950634, 13.718978062873198, 13.727316226517866, 13.656066612805246, 13.613789363715679, 13.743623408755314, 13.736977834220136, 13.602716719881093, 13.663563667635234, 13.62881219522605, 13.642571996285401, 13.684891127715069, 13.552729633336378, 13.722320681269425, 13.688784634409584, 13.681265629893907, 13.655688148500278, 13.889373816531247, 13.612825342345905, 13.606765349789637, 13.795350032043327, 13.82650292060858, 13.841286651582926, 13.657986925155127, 14.058341453040232, 13.751822923564026, 13.936886101042488, 13.90058603143137, 14.193189631919063, 14.225976069809075, 14.830844952562549],
},
"2022": {
"x": list(range(1, 88)),
"y": [15.816438075969113, 16.120385966332037, 15.882429676047822, 15.754141510831133, 15.3879948181939, 14.847440397508679, 14.559122186153141, 14.392608974240208, 14.271479310233566, 14.151814366776497, 14.033446724531911, 13.971139835079242, 13.946657171368635, 13.923168976370057, 13.908213326289514, 13.903962921781009, 13.883435189687164, 13.868214256361957, 13.853316203275403, 13.850156274630233, 13.83800413007661, 13.828456929678238, 13.823667080256051, 13.837379627152984, 13.85468762648662, 13.842118819095077, 13.846068401970452, 13.866145193860882, 13.87683103331106, 13.883902318309158, 13.843314542816382, 13.848955212935406, 13.825679672773983, 13.825203585467685, 13.800650657685432, 13.771987156235094, 13.745277332204294, 13.74899618896188, 13.710350289788519, 13.699009636752562, 13.72574984380712, 13.69379612714152, 13.657631333739795, 13.687110795197487, 13.641654848107489, 13.68555427745178, 13.626523037803157, 13.656569173850187, 13.64357081552712, 13.655564923630237, 13.650126005189923, 13.66108116025011, 13.636544222792033, 13.663746867549065, 13.626176670833402, 13.59824157968966, 13.674717201935882, 13.694557928731372, 13.727707429817114, 13.657670720998764, 13.54889394004633, 13.69650375543492, 13.692110648403906, 13.55263976838036, 13.630076360505104, 13.593884835135345, 13.596113596592723, 13.602738980430088, 13.490250965065599, 13.698940481247519, 13.583385809300575, 13.60991931296976, 13.581332737838016, 13.824623548139833, 13.533893973585819, 13.533775394793583, 13.755699578934374, 13.759936297399996, 13.87244513763899, 13.616014488643092, 14.09812993251356, 13.710074602518604, 13.91784066420223, 13.912311265620039, 14.203969619716446, 14.255022778711806, 14.830844952562549],
},
"2023": {
"x": list(range(1, 88)),
"y": [14.789164834058647, 14.780127256037884, 14.819678850556608, 14.733221736292204, 14.715123895744814, 14.569614305023329, 14.396346309952783, 14.267962672112828, 14.173985658599138, 14.070884007245896, 13.974284099164725, 13.918302031044524, 13.898843341205037, 13.879919458330534, 13.865098670719211, 13.851559827592494, 13.844906626448243, 13.827295800961403, 13.820810936762644, 13.809543815857673, 13.804536613446562, 13.804859924468062, 13.785889612091664, 13.802986923401033, 13.830453100698728, 13.816370948078971, 13.830157632336801, 13.839051100924063, 13.84746613758983, 13.860297269342437, 13.815378459306658, 13.812782079759149, 13.793416550465908, 13.815821643865219, 13.78691014152164, 13.740292216550131, 13.709841553660574, 13.745287154982947, 13.691633688757076, 13.67702798250515, 13.665734867137164, 13.660225685620617, 13.636580976940015, 13.658398179452709, 13.607051808944078, 13.641436611855841, 13.593798625450953, 13.61361178624699, 13.638190686281677, 13.646499055714083, 13.591038080776018, 13.622992917555028, 13.587839722276074, 13.630829824495837, 13.629461225299615, 13.592200956351647, 13.615680520490306, 13.630341745716859, 13.677426157763774, 13.626805264232148, 13.564525550141198, 13.67038341024563, 13.672981832082215, 13.525896811417093, 13.563993050553714, 13.611941675078645, 13.553760533281189, 13.59021111451196, 13.470082500603052, 13.59912543494902, 13.509683974597134, 13.521390742472398, 13.520602741034393, 13.725732516220367, 13.402650383856045, 13.482679094860476, 13.645693009561771, 13.775875527667997, 13.832068021284835, 13.498004659433413, 14.094763215759677, 13.660926796721734, 13.834609766490832, 13.863488794330497, 14.180579199558213, 14.222775721949759, 14.830844952562549],
},
}
# Build the figure in one step: every entry of `data` becomes a
# "lines+markers" trace drawn from that entry's "x" and "y" lists, and the
# dict key (the year) is used as the legend label.
fig = go.Figure(
    data=[
        go.Scatter(
            x=series["x"],
            y=series["y"],
            mode="lines+markers",
            name=label,
        )
        for label, series in data.items()
    ]
)
# Plot, axis and legend titles.
fig.update_layout(
    legend_title="Year",
    yaxis_title="Average Perplexity",
    xaxis_title="Number of Dumps Duplication",
    title="Perplexity Across Different Dump Duplication Counts",
)
# Nothing is displayed here; the finished figure is only bound to its own
# module-level name.
graph6 = fig
#llama graph 1
import plotly.graph_objects as go
# Duplicate-count ranges; these are the categorical x positions of the plot.
buckets = ["1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000"]
# Average perplexity keyed by year. Each list is plotted against `buckets`,
# so position i of a list belongs to buckets[i].
data = {
    "2014": [10.036774097041135, 9.306693996275795, 9.442327622499175, 9.015408185880002, 9.94583162297666, 9.141712571508352],
    "2015": [9.46310273785878, 8.763464863196129, 9.075851726027564, 8.868392446242012, 9.113560631617027, 8.037411460181893],
    "2016": [9.41413706166537, 8.645126825996691, 9.527148465147846, 9.120345162203675, 8.9228845723255, 9.14052983061081],
    "2017": [9.50318602661455, 9.473904977192573, 9.755998086072951, 8.968012141869462, 8.895860780054043, 8.757970647106037],
    "2018": [9.007669062339426, 10.95829859145081, 10.128151243953157, 9.451949410987668, 8.863879736723902, 8.440366034517687],
    "2019": [8.388255660116407, 10.676105294328789, 9.728353939624842, 9.381837094065533, 8.401723232809463, 7.5705604983353325],
    "2020": [10.112246017864624, 10.255251179892559, 9.233548505479437, 9.25131862646364, 8.458532176757009, 7.4808205167223525],
    "2021": [10.239269162661959, 9.54987953569235, 9.067380903629866, 9.014261939731549, 8.14345667720481, 7.312019290288715],
    "2022": [9.931951075969451, 9.12737570591033, 8.995868137602248, 9.00805668763514, 7.882044010499616, 7.538858258386088],
    "2023": [8.646614152066428, 8.806922449908505, 8.816629232137835, 8.995152677487027, 7.737747701620713, 6.77703951001925],
}
# Start from an empty figure and append one trace per year; every trace is
# plotted over the same `buckets` categories.
fig = go.Figure()
for year, perplexities in data.items():
    trace = go.Scatter(
        name=year,
        x=buckets,
        y=perplexities,
        mode="lines+markers",
    )
    fig.add_trace(trace)
# Plot, axis and legend titles.
fig.update_layout(
    legend_title="Year",
    yaxis_title="Average Perplexity",
    xaxis_title="Bucket (duplicate count range)",
    title="Perplexity Across Different Buckets",
)
# Nothing is displayed here; the figure is only bound to its own name.
llama_graph1 = fig
##llama graph 2
import plotly.graph_objects as go
# Year labels "2014" .. "2023"; these are the x positions of the plot.
years = [str(year_number) for year_number in range(2014, 2024)]
# Average perplexity keyed by duplicate-count bucket. Each list is plotted
# against `years`, so position i of a list belongs to years[i].
data = {
    "1-1": [10.036774097041135, 9.46310273785878, 9.41413706166537, 9.50318602661455, 9.007669062339426, 8.388255660116407, 10.112246017864624, 10.239269162661959, 9.931951075969451, 8.646614152066428],
    "2-5": [9.306693996275795, 8.763464863196129, 8.645126825996691, 9.473904977192573, 10.95829859145081, 10.676105294328789, 10.255251179892559, 9.54987953569235, 9.12737570591033, 8.806922449908505],
    "6-10": [9.442327622499175, 9.075851726027564, 9.527148465147846, 9.755998086072951, 10.128151243953157, 9.728353939624842, 9.233548505479437, 9.067380903629866, 8.995868137602248, 8.816629232137835],
    "11-100": [9.015408185880002, 8.868392446242012, 9.120345162203675, 8.968012141869462, 9.451949410987668, 9.381837094065533, 9.25131862646364, 9.014261939731549, 9.00805668763514, 8.995152677487027],
    "101-1000": [9.94583162297666, 9.113560631617027, 8.9228845723255, 8.895860780054043, 8.863879736723902, 8.401723232809463, 8.458532176757009, 8.14345667720481, 7.882044010499616, 7.737747701620713],
    "1001-30000000": [9.141712571508352, 8.037411460181893, 9.14052983061081, 8.757970647106037, 8.440366034517687, 7.5705604983353325, 7.4808205167223525, 7.312019290288715, 7.538858258386088, 6.77703951001925],
}
# One trace per duplicate-count bucket, each plotted over the shared `years`
# axis and labelled with its bucket name.
fig = go.Figure()
for bucket, perplexities in data.items():
    fig.add_trace(
        go.Scatter(
            x=years,
            y=perplexities,
            name=bucket,
            mode="lines+markers",
        )
    )
# Plot, axis and legend titles.
fig.update_layout(
    legend_title="Bucket (duplicate count range)",
    yaxis_title="Average Perplexity",
    xaxis_title="Year",
    title="Perplexity Across Different Years",
)
# Nothing is displayed here; the figure is only bound to its own name.
llama_graph2 = fig
#llama graph 4
import plotly.graph_objects as go
# Average perplexity per year, indexed by dump-duplication count.
# For each year, "perplexities" is plotted against "dumps". The "dumps" axis
# is the consecutive sequence 1..N, so it is generated with range() instead
# of being typed out by hand; this matches the list(range(...)) form already
# used for the other per-year datasets in this file and removes the risk of a
# mistyped or missing index. N differs per year (7 for 2014 up to 87 for 2023).
data = {
    "2014": {
        "dumps": list(range(1, 8)),
        "perplexities": [9.73915022954687, 8.917501442736835, 10.870824235415164, 8.839485979263355, 9.114611185408386, 9.00595271327483, 9.069847072965578],
    },
    "2015": {
        "dumps": list(range(1, 15)),
        "perplexities": [9.219127989173247, 8.610711104284512, 8.505043568675715, 7.990039784261444, 8.107957918641446, 8.796945238229792, 8.013223752027935, 8.890635712836795, 8.83059261426682, 10.04094169141142, 8.570752850736193, 9.003542320883396, 8.587190578806105, 7.983045509484727],
    },
    "2016": {
        "dumps": list(range(1, 24)),
        "perplexities": [9.224890447512712, 8.982140506828461, 7.624091188629551, 8.97063321078077, 8.261724045845817, 7.793111396647548, 7.829316622145423, 8.597365842164928, 9.301981760525631, 9.66361415155858, 9.258511719598742, 9.441774097297651, 9.429412341325685, 9.325699904738741, 8.836147021549138, 8.607104273128627, 8.722839588316196, 8.920039351586981, 8.914454312645233, 8.899123060759182, 9.793833500279591, 10.134616145581552, 8.353063455545444],
    },
    "2017": {
        "dumps": list(range(1, 35)),
        "perplexities": [9.488743166894329, 9.683975569858143, 8.654505727247006, 8.066421362212841, 8.395709115228499, 8.500311197527102, 9.10900254771213, 7.794618707693523, 8.059130491102199, 7.840987528913394, 8.94443662009675, 8.811736884161157, 9.395950762255111, 8.88696403862443, 9.064476456994532, 9.474527237081157, 8.91858984698398, 9.008242064314263, 8.840440114974651, 7.978242830053041, 8.653702083122754, 9.395390940155544, 8.644847872201382, 9.017641716864084, 8.731668787167907, 7.294766100138992, 9.116288498873331, 8.812157001137116, 8.229244256822179, 10.705494840702238, 8.4287361645181, 9.127134117671186, 8.418280990577143, 8.223315656547781],
    },
    "2018": {
        "dumps": list(range(1, 47)),
        "perplexities": [9.896529727642656, 9.375668627700882, 9.53229676611742, 9.709666311696747, 9.371857870215996, 9.756320954898577, 9.3489352873219, 9.41874088848098, 9.220103832539115, 9.493717136086154, 9.894783254332049, 10.271325431375882, 9.444295310961042, 9.259722713114918, 9.121852071096205, 10.266770364074752, 9.322189177071575, 9.200133535506806, 9.391739906453976, 9.166754675924274, 9.386922783373333, 9.269174320074539, 8.921691129048623, 8.500872698966008, 8.427801104408742, 8.957096089538366, 8.843138224464884, 8.839757712227849, 8.730159045861498, 8.761283943113895, 8.955585790830773, 9.480108588809301, 8.975279317370992, 8.647350666497408, 8.040519395112794, 8.154306078995903, 9.047836211768528, 8.388013770335506, 9.27023552172876, 8.392778372966038, 9.698769530780428, 8.48774562040954, 9.832837942793894, 8.801856106666897, 9.090280166741453, 8.066384841477534],
    },
    "2019": {
        "dumps": list(range(1, 59)),
        "perplexities": [9.32068228893817, 11.36279410700072, 9.729296413744873, 10.951540717951199, 9.571599362297537, 8.746033912439227, 8.911359607667526, 8.652716464937903, 8.90908579802875, 9.526405246155608, 8.84494033246573, 9.45556467668226, 9.61666194147301, 9.471820461436957, 9.385272422926384, 9.300484355205835, 9.374562863672638, 8.921445075261644, 8.457279643164815, 8.911117277418406, 8.076917631172464, 8.58392948648068, 9.138574660565174, 9.03583800697058, 8.706482138788626, 8.581302039813796, 8.567006611519137, 5.454819541045107, 8.380493341695487, 8.129823277176698, 7.346580306828866, 8.182982036096053, 8.03219664626822, 8.434163783307083, 8.148075720769123, 8.20825575224898, 7.7034049100948945, 8.319494286475098, 8.449794025203127, 8.40448676995273, 8.394065958286836, 8.431905407945235, 8.684778696918817, 10.170628597487527, 7.685742913353763, 8.317540224765809, 7.100457493121143, 5.389889122637774, 6.52302432138372, 8.895820543553361, 8.540964121500908, 5.823656104193133, 8.946389481295038, 8.03972593805594, 7.406476375508138, 7.434287132433397, 8.592981328562821, 9.803727252301018],
    },
    "2020": {
        "dumps": list(range(1, 68)),
        "perplexities": [10.012609650486192, 7.943056443498068, 8.44096110442561, 9.029669769296477, 8.409724985539306, 8.731282990251563, 8.434833756562051, 8.497304934371442, 8.467244156051745, 8.606236488210545, 8.805728093624284, 9.375705002747582, 9.21767027458378, 9.048307919892986, 9.77562185114431, 8.730686261181575, 9.434356327584526, 9.119611839878791, 9.17722037907838, 8.569631235903184, 8.899794145233415, 9.315415673275877, 8.170599811786479, 8.538223762760031, 8.19667246899941, 8.740262061758479, 8.335448351341697, 8.321473204597588, 8.505543388481339, 8.552966240767482, 8.350236112276809, 8.109081033072668, 8.539929546398097, 8.535623890267809, 8.152345891530405, 8.399872141360548, 7.737922667873269, 8.15695720088359, 8.175043636189214, 7.595645045643389, 7.911222051300795, 8.645606075472527, 8.114112476153545, 8.054768997187903, 7.800103557084926, 8.096027154350947, 8.10653262234877, 8.029447458295808, 7.192697926255588, 9.370330492895473, 8.523467886567657, 7.313215625083473, 8.839958839301076, 8.656716147817143, 8.137974531785895, 8.523363904379156, 6.108894835851177, 7.818953624010673, 8.49431208395812, 8.342596121020756, 7.742470144320784, 6.682052985671971, 6.759804959168626, 9.093551460193316, 7.062030527371495, 8.434506543833649, 6.781692983120098],
    },
    "2021": {
        "dumps": list(range(1, 77)),
        "perplexities": [9.841089195168713, 8.366233239891208, 8.059521351436208, 8.318918468325863, 8.324706089968892, 8.32605366049384, 8.435930736985704, 8.66800508008913, 8.406990633173743, 8.962431358959584, 8.850717354466074, 9.1716199955458, 9.302688993535714, 8.939046098190769, 9.051679849424985, 8.682789687366284, 8.994991585405426, 8.561380912367396, 8.787500555168679, 8.843251281455629, 8.7217706466806, 8.381660448144187, 9.395216774912862, 8.591359926732526, 8.453429031525232, 8.456509570151965, 8.628116911794814, 8.53819222436614, 8.730438299562152, 9.376235492300244, 8.15154442462199, 8.54875158466325, 8.163866477674533, 8.304409143008455, 8.856929571720633, 8.167913697870857, 7.84492260274128, 8.162407286516313, 8.321838697740313, 8.253127215455834, 8.248563253933684, 8.499374467029739, 8.680742460396948, 7.967559876484448, 8.095069183089077, 7.912424470771882, 7.7624804836167565, 7.807769541801359, 8.016590141394108, 7.6555859978103316, 8.416070459989983, 7.512191560306614, 7.994576039964321, 7.185188422240499, 7.660311594811295, 7.23106290817905, 6.982644852723388, 7.843742555580493, 7.005057894403877, 8.430250121211994, 5.657881355879867, 6.726292542438366, 7.486937111190708, 7.712303495834796, 6.246962399681747, 6.92875404699629, 5.329766234792039, 5.709327997807491, 7.971206942045293, 5.686373279239376, 6.1781744792525615, 8.241084719551052, 8.439160967397711, 7.65310078654845, 6.327069191350794, 3.91910919080523],
    },
    "2022": {
        "dumps": list(range(1, 83)),
        "perplexities": [9.483592568856565, 7.189994228954454, 8.316909239194644, 7.86424678656687, 9.220674611582542, 8.321976529350732, 9.10888002884781, 8.225969911900018, 8.384237608546773, 8.780327271679809, 9.364145618644377, 9.495859713757827, 9.106949174218812, 9.23421176581141, 9.163921762844911, 8.794794461344875, 8.828930317074237, 8.910619607048394, 8.875861267417038, 8.806690212582172, 9.061056708418198, 8.866883414667015, 8.67286618308663, 8.682273027254936, 8.305102405030174, 8.189733511502775, 8.924337748216326, 8.659728319566609, 8.444422835653581, 8.755250021389994, 8.000000289145156, 8.081525926632303, 8.061721834769063, 7.895475427973516, 8.287032632326136, 8.472773038016852, 7.663326197885218, 7.847535650315383, 7.732755997953167, 7.960257016089297, 7.608447426559309, 7.598389147784626, 7.946761405541756, 7.773873549407202, 8.126908611820289, 7.916664649722816, 7.894622086606636, 7.680503580812927, 7.727898320658088, 7.432772901777352, 8.202398282489195, 8.042184753937285, 7.73548358717129, 7.682704039184239, 8.158164009607694, 7.345186708566949, 7.828163052277644, 7.611824744941703, 7.241808787698759, 7.582892852952833, 7.879397809151155, 7.134581497547041, 7.78667356422719, 6.656397614763345, 7.023352560594163, 7.362930730205023, 7.3699197483652386, 6.7454140379422265, 5.903262622771099, 6.434879224359672, 7.306608742238141, 7.9100884219615555, 7.924947631037447, 8.120669403708789, 7.8919156097528464, 7.295660656533646, 5.599201327007343, 5.260468504600074, 6.889443342018529, 5.396932289937023, 6.7357812331788285, 7.079240389198726],
    },
    "2023": {
        "dumps": list(range(1, 88)),
        "perplexities": [8.70489099557147, 7.743567081947979, 5.707700759513075, 7.42267071929539, 7.528257194741652, 6.766266255314377, 8.140487690026744, 7.968460364579144, 8.378534732391445, 8.462864835761868, 8.750163467122363, 9.030159982511133, 8.947498611252533, 9.26185161266797, 9.148155404351185, 9.160868347246595, 9.132536983584458, 9.12916497406581, 9.027825944368539, 9.127169658958355, 9.087762413460762, 9.288851446582335, 9.21606664952798, 9.10292838042461, 9.142519978568224, 8.822355646917647, 8.900446619619732, 8.79981304565808, 8.918708459617246, 9.13267243596762, 8.759214105765599, 8.961577284078654, 8.12181490449537, 8.43888231714366, 8.724831350613316, 8.258762532936931, 8.337583232620341, 8.223678511207945, 8.19914152935067, 8.250449659843008, 8.488274186714182, 8.063794656047826, 8.267469501822353, 8.109403400519883, 7.897519766033864, 8.029859903259943, 8.01415790723292, 7.852726835204203, 7.524006414246027, 8.016485804552786, 8.181980185953115, 7.7865858384362445, 7.630488133713028, 7.744179998387641, 7.9618609986528766, 7.818104340203628, 7.873732400580378, 7.643522973769515, 7.743819932052891, 7.603304862075835, 7.499516191588959, 7.919857492185231, 7.294200517555408, 7.835098137549298, 7.562994060655124, 7.426074658906729, 7.4503303575596185, 7.6402144041645315, 6.889172499203354, 7.869082402525025, 7.476479798274207, 7.46012411648056, 7.016878527752248, 7.233305845472016, 6.657949958745544, 6.2352925881040875, 6.558931554888652, 6.094819134587699, 6.444696396841287, 5.338755088514068, 5.367611973164904, 5.425863412036782, 4.20042362030674, 5.111941016244413, 5.149295160813693, 3.9082208202377435, 2.6866750639387136],
    },
}
# Build the figure in one step: each year contributes a "lines+markers"
# trace of its "perplexities" over its own "dumps" axis.
fig = go.Figure(
    data=[
        go.Scatter(
            x=series["dumps"],
            y=series["perplexities"],
            mode="lines+markers",
            name=label,
        )
        for label, series in data.items()
    ]
)
# Plot, axis and legend titles.
fig.update_layout(
    legend_title="Year",
    yaxis_title="Average Perplexity",
    xaxis_title="Number of Dumps Duplication",
    title="Perplexity Across Different Dump Duplication Counts",
)
# Nothing is displayed here; the figure is only bound to its own name.
llama_graph4 = fig
#llama graph 5
# Data for different buckets and years
import plotly.graph_objects as go
# Average perplexity per year across duplicate-count buckets.
# Every year uses the same six bucket labels, so the labels are written once
# here instead of being repeated in each entry (where a typo in one copy
# would silently misalign that year's trace).
_bucket_labels = ("1-1", "2-5", "6-10", "11-100", "101-1000", "1001-30000000")
# One list per year; position i belongs to _bucket_labels[i].
_bucket_perplexities_by_year = {
    "2014": [9.276942939297756, 8.69938211424056, 8.158271167692497, 8.367670702299348, 6.583755343348351, 7.497674909399879],
    "2015": [9.103981560121444, 8.198551019737206, 8.17752561770772, 8.233928498586414, 6.517481691960036, 7.3736492145399355],
    "2016": [9.023271012270133, 8.067050538323626, 8.150103850870096, 8.232721560484496, 6.3749350052179015, 7.350697996200808],
    "2017": [9.129487810210167, 8.290815319993621, 7.878257519772607, 7.98292071692709, 6.524893452272168, 6.918924770013169],
    "2018": [9.213411471804902, 7.89026459259236, 7.403516159589743, 7.556076611087452, 6.6509342133282745, 6.493818412135467],
    "2019": [8.96407327327958, 7.628975687395983, 7.036189728869401, 6.6349379440939895, 6.446837262269017, 6.086615106309735],
    "2020": [9.137673180826452, 7.794611238323424, 7.059198583303955, 6.82070782491814, 6.64418110544852, 6.271177318179787],
    "2021": [9.178752781806578, 7.70543845537127, 6.698443323550492, 6.472409310902069, 7.307749809853384, 6.782598533191676],
    "2022": [9.096031774523855, 7.652072280274248, 6.615135590934534, 6.239500427643811, 6.787412545253696, 6.99638904682498],
    "2023": [8.728460642325789, 7.561677894180029, 6.194391269071906, 5.775947387872692, 6.054439209079063, 5.3384410032299],
}
# Same shape as before: year -> {"buckets": [...], "perplexities": [...]}.
# list(...) gives every year its own label list, as in the hand-written form.
data = {
    year: {"buckets": list(_bucket_labels), "perplexities": values}
    for year, values in _bucket_perplexities_by_year.items()
}
# Start from an empty figure and append one trace per year, plotting that
# year's "perplexities" over its "buckets" labels.
fig = go.Figure()
for year, year_data in data.items():
    trace = go.Scatter(
        name=year,
        x=year_data["buckets"],
        y=year_data["perplexities"],
        mode="lines+markers",
    )
    fig.add_trace(trace)
# Plot, axis and legend titles.
fig.update_layout(
    legend_title="Year",
    yaxis_title="Average Perplexity",
    xaxis_title="Bucket (Duplicate Count Range)",
    title="Perplexity Across Different Buckets",
)
# Nothing is displayed here; the figure is only bound to its own name.
llama_graph5 = fig
##llama graph 6
# Data for different years and duplication counts
data = {
"2014": {
"duplicates": list(range(1, 88)),
"perplexities": [9.73915022954687, 8.920626670584653, 10.794318768046299, 8.843588010546013, 9.050843813116494, 8.930966597941875, 9.037282952268393, 8.861595199889763, 8.753115155540607, 9.750853693230052, 8.684437196297443, 9.220661575409212, 8.779997997083122, 8.395973456433415, 8.73217254093509, 8.881588084417483, 8.631494252144279, 8.819106667105284, 8.896815931063438, 8.659420224734506, 9.093486198999384, 9.696607960142106, 8.508805626033137, 8.770987058526325, 8.618185592039293, 7.915860238031309, 8.83767692043796, 8.727961757725632, 8.485070840013236, 9.764445257512499, 8.600757313466264, 9.081950235300344, 8.644217818204663, 8.55864241676558, 8.233431060928043, 8.184825012856324, 8.457157826105203, 8.306222356999731, 8.804352979539, 8.313005637251672, 9.026721732161297, 8.449083429742776, 8.733235778798473, 9.006749183049818, 8.200737283467852, 8.251897579249375, 7.787355375938481, 7.268723383407269, 7.571889349513068, 8.351626749016013, 8.400107029097354, 7.723260069861529, 8.064236740258659, 7.888157433279341, 8.148191006636575, 7.906415374915906, 7.676551458219022, 7.967158452060384, 7.932665786459153, 7.9763750026305305, 7.667885913458702, 7.839381126838969, 7.92098160290061, 8.028601269205508, 7.563111341601447, 7.6678178481341215, 7.111641341466761, 7.42738813332767, 6.926910421359465, 7.363397686520664, 7.4639497513997775, 7.970748152252673, 7.356418997104175, 7.343504223513313, 6.8766667549967355, 6.358501202955649, 6.424115736059589, 6.008071046749611, 6.639372134895001, 5.6177395770356835, 5.443864799344331, 5.6647930543792, 4.172380654474099, 5.128083927608737, 5.146055825516793, 3.8998212782432287, 2.6866750639386963],
},
"2015": {
"duplicates": list(range(1, 88)),
"perplexities": [9.219127989173247, 8.662048439524266, 8.38989056455147, 7.962841520680627, 7.9129221891669, 8.601740522408205, 7.072072698161579, 8.547935092167322, 9.032202360967963, 9.644330594119374, 8.8352494084492, 9.04389212105191, 8.887379409385023, 8.467909602302054, 8.822876185378563, 8.655601459122618, 8.73446662907839, 8.858527575243034, 8.884133792160123, 8.489950876265588, 9.093447553065644, 9.577116330804195, 8.564448599529959, 8.758142067509203, 8.56227523869569, 7.897451823056177, 8.780353272984362, 8.69589044489135, 8.469444871399634, 9.707586741035607, 8.549040139041137, 9.062827976790162, 8.645009864743498, 8.544819434495203, 8.218203612587951, 8.191690418776773, 8.42249826138689, 8.296810827637307, 8.760096580513409, 8.3252124274653, 8.992877987118824, 8.454953276821902, 8.699916032688582, 8.953715077645272, 8.181603571788644, 8.193005628373307, 7.792425191978106, 7.2744004758877745, 7.554966996453596, 8.35034561406835, 8.41512904956328, 7.684576106312188, 8.064672849239695, 7.937226299628162, 8.236727165389356, 7.824011302908751, 7.622715782362401, 7.960707630747855, 7.932794820691164, 7.929912243495168, 7.655015402069077, 7.962802955194318, 7.851307904639461, 7.964993709642837, 7.551712280758451, 7.708432510205161, 7.1666588182507835, 7.3873387045347325, 6.911323642701545, 7.47032697252429, 7.5402879073116535, 7.826497044764086, 7.269655663988105, 7.343193140755126, 6.732955100033813, 6.447813049685099, 6.444597512230532, 6.007330197959276, 6.503017736395001, 5.297028390356502, 5.425460792319903, 5.536870445249572, 4.171727106880239, 5.112414745674864, 5.144884382794889, 3.914611382312465, 2.6866750639386963],
},
"2016": {
"duplicates": list(range(1, 88)),
"perplexities": [9.224890447512712, 8.865209727234555, 7.716537450318067, 8.505567000250219, 8.231186376526843, 8.439303045267778, 7.877163015312243, 7.994466878194956, 8.658354490436203, 8.525931733072895, 9.410755179427637, 9.700628031783868, 8.99451144975165, 9.002303200677753, 9.126870672453386, 9.422070510449645, 8.936682491853515, 8.911484811267863, 8.891667216351042, 8.666177883702614, 9.155910144590026, 9.594754908402185, 8.621298759427466, 8.787852330773674, 8.7227109238452, 7.982914897395895, 8.878126149070932, 8.717610707273684, 8.500066718763687, 9.77299952938655, 8.484499188420418, 9.006429013502562, 8.589528938847574, 8.48246092046138, 8.167057989146516, 8.171040607118929, 8.37171605234296, 8.266790595091017, 8.734798864250555, 8.29240112699872, 8.963302188522936, 8.41185193834277, 8.658957651571432, 8.923242538915662, 8.078070177365753, 8.153012171180952, 7.737730977556822, 7.323638159806731, 7.59168066096202, 8.37506434888842, 8.423868629202383, 7.671655504568603, 8.065075392658766, 7.976138380650688, 8.205116203468345, 7.81671515229199, 7.552886431000103, 7.904920126191346, 7.86434557317493, 7.888281162416497, 7.619817540814656, 7.956601658437982, 7.850774863461917, 8.024547071152215, 7.517340246604877, 7.638602768798686, 7.109799072356206, 7.351570828393637, 6.931128546796388, 7.506046773490761, 7.4664617315330455, 7.669725603465176, 7.254794269540855, 7.3180585905711455, 6.736605721220725, 6.380176442621056, 6.484391243201081, 6.037335383847396, 6.5047803196868665, 5.393419865823429, 5.382493790662867, 5.530611638476127, 4.195599613009973, 5.12749648121783, 5.162191190570913, 3.916322213479375, 2.6866750639387456],
},
"2017": {
"duplicates": list(range(1, 88)),
"perplexities":[9.488743166894329, 9.898479048180542, 8.696778620360424, 8.366687823872034, 8.630884650266044, 8.676086291852428, 9.334997107239593, 9.185879201546161, 8.84595356333466, 9.393437387426701, 9.45406621593655, 9.624060249862962, 9.532091483098174, 9.28384082428477, 9.469552273926178, 9.409055052262094, 9.358522040360171, 9.297106280140776, 9.073575169188139, 9.100944640377902, 9.23197269860482, 9.245904776150217, 9.170311706541447, 8.910824090510237, 8.795205662257203, 8.552457741951807, 8.930826813105282, 8.265717221808657, 8.603004747276188, 9.612646939458466, 8.552662222672813, 8.998548290935052, 8.560421893590284, 8.474723014427948, 8.206627804901014, 8.223373542290199, 8.398403355144557, 8.287572376736062, 8.754052702949243, 8.299825024291893, 8.941167619680243, 8.415160982913156, 8.638716545065352, 8.848352711284978, 8.027616325562285, 8.215417483840307, 7.796294849683444, 7.352280888696609, 7.632599613586875, 8.212116380094994, 8.36906213664436, 7.611956268590032, 7.998619733141829, 7.856761646868557, 8.045287904958364, 7.748316066259832, 7.501006529761084, 7.741538102662183, 7.751563576545041, 7.770809347580409, 7.433360335360308, 7.521045712972479, 7.342706611396849, 7.668010856653189, 7.324083777740233, 7.408132498092624, 7.120381253454176, 7.197819855700191, 6.845740773242076, 7.434903892374942, 7.30172469589484, 7.572324587463354, 7.2429522069242855, 7.407759480504424, 6.731089619105264, 6.270051935102005, 6.3655986521155326, 6.030460569178489, 6.450442179508357, 5.330140935634091, 5.408213974705514, 5.4956074785168365, 4.202359666343794, 5.132012988189369, 5.155812750486333, 3.917511891854019, 2.686675063938749],
},
"2018": {
"duplicates": list(range(1, 88)),
"perplexities": [9.896529727642656, 9.291082874617985, 9.691247942464267, 9.726042361988922, 9.023219233278645, 9.828083681879585, 9.061982292637602, 9.222594755383295, 9.221127620511943, 9.147737783035632, 9.217942333429908, 9.539190089929702, 9.468073594196243, 9.437273531098606, 9.435014041935224, 9.273790337174349, 9.396223055633108, 9.287408522624531, 9.106775224145558, 9.116191168902963, 9.237111779685268, 9.209051051549245, 9.222483610869865, 9.135002988610983, 8.788784301843895, 8.934854040474761, 9.017725654773155, 7.556551156032443, 8.798309646970585, 9.013026921998197, 8.454361664597716, 8.74055667139578, 8.44422407689182, 8.32983201978779, 8.359235182862202, 8.353476542703998, 8.197721584268855, 8.26450576475226, 8.595793902257883, 8.225557269937037, 8.826470933221817, 8.293081795411524, 8.570012186388858, 8.770785639469723, 7.88712952313622, 8.04581707470935, 7.626361664897192, 7.1029187216659935, 7.320944236203329, 8.070993423549334, 8.27396015964389, 7.3820727875281875, 7.903671423277116, 7.7618204686483825, 7.827655269209816, 7.675624293658499, 7.264953900477738, 7.583393879771943, 7.602901960669463, 7.671533291630901, 7.276738084631234, 7.3453361167238915, 7.135545835325713, 7.485342152740761, 7.167623169217046, 7.381420434659487, 7.025242147597371, 7.069891649575291, 6.69865442435757, 7.328644984573098, 7.258232298527563, 7.535910329008589, 7.255533113180425, 7.560918656956746, 6.666615954230938, 6.221938216559355, 6.336678407141162, 6.054298848202251, 6.548775617064581, 5.321650356255492, 5.4358231429446455, 5.421178189821786, 4.244486836711896, 5.109567298910753, 5.17074725626889, 3.9038325478573555, 2.6866750639387633],
},
"2019": {
"duplicates": list(range(1, 88)),
"perplexities": [9.32068228893817, 11.395142057563769, 9.418956531524783, 10.900691920426821, 9.438262555370176, 8.884239866713687, 9.062124035437813, 8.50267614928243, 8.638876645072413, 8.686925644350039, 8.714235065140539, 9.113035752580663, 9.125236586170647, 9.163963570975344, 9.25494911293901, 8.935379208998043, 9.225725827052665, 9.033303873966254, 8.950682642906997, 8.903920653639469, 8.911229320689435, 9.015000200687188, 9.096624316542014, 9.016863768067717, 8.737328799715891, 8.788723623351723, 8.932436150017006, 7.699853163934218, 8.707767111902166, 8.95646015823901, 8.35912690813594, 8.398373212501705, 7.932236470700611, 8.161242760113705, 8.609004455587062, 8.226779586405538, 7.842118333008395, 7.9881363454553, 8.036089351408874, 7.920609938080794, 7.95212600254153, 7.579485372600602, 7.88538668960003, 7.9594135744662236, 7.514800487806593, 7.689464139444159, 7.7544565651227, 7.41897302703282, 7.214254081876507, 7.895563781767841, 8.100226164186843, 7.272920541743749, 7.915118433849716, 7.658091861348199, 7.791626057064827, 7.627133141656945, 7.251831253315811, 7.569422424576574, 7.4906231710283935, 7.624606161129255, 7.152179142613762, 7.400538018976905, 6.9780334804483495, 7.455001719017696, 7.07739603554367, 7.201520909070617, 6.8033512129548726, 6.932923527827607, 6.796367425560507, 7.349719615399371, 7.290546797526088, 7.5224745941917055, 7.234885644016566, 7.373214375228053, 6.746192846100825, 6.23400120737243, 6.33988992018498, 6.030827322485673, 6.526425922427022, 5.371781592457229, 5.52171375482226, 5.521789795055974, 4.281913900699859, 5.135628510388279, 5.198507257987441, 3.9021738986547896, 2.6866750639387633],
},
"2020": {
"duplicates": list(range(1, 88)),
"perplexities": [10.012609650486192, 7.996780616269575, 8.486989186126861, 8.589723559690643, 8.39765295502809, 8.493985763693104, 8.444565685004276, 8.521057974766807, 8.262640776205831, 8.635134709906502, 8.811211245843253, 9.235066189908858, 9.022297426838923, 9.050058439072979, 9.021682564717057, 8.873493708246608, 9.015417293624877, 8.740954222830077, 9.0380883860745, 8.889091357432216, 8.912750014641842, 8.882441443817264, 8.998337842644444, 8.921169948677084, 8.691071558938896, 8.49208784075201, 8.776939087082413, 8.594979421555715, 8.72886934455455, 8.995731720491424, 8.421636184069852, 8.47617010726572, 7.749949346989389, 8.161269940208024, 8.744952692782391, 8.32025892064496, 7.869262480191432, 8.000847753164901, 8.076273972096198, 8.032342430082904, 7.983041009058366, 7.653597631636462, 7.975156835319908, 7.737411017432282, 7.605514142199969, 7.787824887059794, 7.857457978446249, 7.633203676037199, 7.047268036460168, 7.690311434532034, 8.040577048529848, 7.389586464023044, 7.740869008676299, 7.609659150626595, 7.837672584415724, 7.612754624743091, 7.287910254959312, 7.626199197144874, 7.319186118558612, 7.7127748347332385, 6.954623517457656, 7.486793070503545, 7.0394625786365, 7.450374675494852, 7.127267484316468, 7.250906351593999, 6.786363739265897, 6.980573512727148, 6.941463773809052, 7.423486191350063, 7.318743327632096, 7.629349084770016, 7.28811046001031, 7.435335626891362, 6.787682578185395, 6.222443482377916, 6.382107628208513, 5.9634307406816855, 6.574337724456447, 5.299637438768189, 5.445760462611284, 5.536805681860065, 4.174658965854665, 5.1170397769906595, 5.103551563888967, 3.9064523489117278, 2.6866750639387456],
},
"2021": {
"duplicates": list(range(1, 88)),
"perplexities": [9.841089195168713, 8.376002975517325, 8.380380483628153, 8.188986954093957, 8.498635277059357, 8.023999615729231, 8.382569297820478, 8.547323342280805, 8.188133428925276, 8.92217442481792, 9.176245490194058, 9.243284040091787, 9.034153905594078, 9.202098403867247, 9.134743272368441, 8.987006737157861, 8.92449319257734, 8.825574314893755, 8.847995893024844, 8.941295135829169, 8.987413373621635, 8.946047635293768, 8.910627453693433, 8.788838301728244, 8.76786062380576, 8.382956738298825, 8.699642493063092, 8.653055171884096, 8.740110731986059, 8.962375284828505, 8.333692265451546, 8.538371629422324, 7.61125418543177, 8.043172182416328, 8.716508021173402, 8.108788324737684, 7.9519597656706695, 8.013683771558808, 8.146173728648037, 8.096827091707578, 8.084160146852566, 7.625363299166386, 8.20296870216023, 7.82588401311041, 7.70124082508177, 7.78873594093791, 8.037661887779432, 7.5026482593453085, 7.087004259771732, 7.513718369391617, 8.138555082388203, 7.544675643417071, 7.6985222025131135, 7.620353449057761, 7.677585788165064, 7.607561443995849, 7.675688681631018, 7.426483327070772, 7.298729035123734, 7.597011886621879, 7.054853268704371, 7.2720630088080185, 6.999536763473811, 7.4649197409435155, 7.188519614053191, 7.05059392608445, 6.8880258512600125, 7.233553654860446, 6.863558927804786, 7.576343786143615, 7.169748797692396, 7.360833458217927, 7.151198016478686, 7.209746838078912, 6.785065344185751, 6.1445251557486005, 6.316811670053038, 5.861969568678405, 6.340724036900801, 5.198467430353175, 5.459134505462628, 5.462830131530051, 4.189086813428227, 5.114653776848574, 5.111679826185254, 3.920071733342082, 2.6866750639387456],
},
"2022": {
"duplicates": list(range(1, 88)),
"perplexities": [9.483592568856565, 7.19946566373024, 6.689435696789969, 7.735695023912755, 8.891994985807424, 7.974675072464074, 8.38103445140788, 7.767845780936468, 8.394625582114237, 8.433832557729854, 8.774679671114042, 8.974690045840946, 8.970427821588581, 9.259164010333704, 9.106573684091558, 9.082142024590542, 9.00694910652822, 8.951939452627803, 8.834410968583011, 8.976270078171723, 8.9788747911979, 9.147340358822175, 8.94766754786145, 8.863791307783835, 8.876434772786448, 8.537925507030351, 8.824632718943558, 8.670890722043863, 8.713248499915446, 8.991496303395792, 8.497388391287544, 8.694429166461068, 7.660306866593211, 8.063103914688337, 8.463798472858477, 8.147225054222934, 7.98918792448372, 8.129552622440363, 8.156552658413169, 7.993772322199681, 8.077300760319622, 7.687003596840271, 8.216734207325837, 7.818779874173861, 7.784873713139422, 7.841502120166083, 8.009056410739252, 7.643507378655463, 7.027652318922246, 7.578018517117392, 8.21806831598481, 7.738109238050354, 7.657938120144026, 7.670918897910402, 7.789453032753468, 7.6784988295976015, 7.758997892938832, 7.354548111787801, 7.324563987410127, 7.542453103467507, 7.082203068171782, 7.41432116627747, 6.902549671764324, 7.489234680249967, 7.354679134462809, 6.977235447939879, 7.297608588934183, 7.439224077591953, 7.01074155919995, 7.77157588876759, 7.452660719169145, 7.206525557457038, 6.837175958650314, 6.816276605521482, 6.841636273605858, 6.4126962333247475, 6.544729510231483, 5.84044063139556, 6.384392701668377, 5.342064638285962, 5.449806194943077, 5.550638967579051, 4.188085941944831, 5.167854549955437, 5.137630179031516, 3.901881866936028, 2.686675063938701],
},
"2023": {
"duplicates": list(range(1, 88)),
"perplexities": [8.70489099557147, 7.580704259900713, 5.836272117595713, 7.267518477506005, 7.283085974734155, 5.803062744865375, 8.134525344019872, 7.557124524037357, 8.285446726695811, 8.351123312334009, 8.590647921692078, 9.005573576795152, 8.871116907846343, 9.192666716497001, 9.005592946042935, 9.143088639505718, 9.091899749285021, 8.968510745275767, 8.975056578670769, 9.091779598794488, 8.980027479169559, 9.159988763765217, 8.883393229479356, 8.874910963718058, 8.931427901889217, 8.625523963019026, 8.735000607943736, 8.63742312596692, 8.70111762921543, 9.206595504882097, 8.763642440521853, 8.911783192379705, 7.634828216241755, 8.259433628637158, 8.82001651315211, 8.107726825798297, 8.206921799311043, 8.355228813696131, 8.298238657805719, 8.033613885206083, 8.225747435920205, 7.934196000879481, 8.286077333650876, 7.980486854114626, 7.721311081423362, 7.689565789535576, 7.790611228082437, 7.624460645122273, 7.0093123271820055, 7.791169711054489, 8.14175443228974, 7.776459425768002, 7.526576191153727, 7.756713091828537, 7.801566191856336, 7.843167604084829, 7.7089466527367705, 7.409181212687685, 7.442037119594963, 7.337342474375209, 7.190330728288846, 7.254100247522111, 6.79586626781295, 7.483337535174346, 7.294262214559599, 7.030373799134058, 7.149000704995256, 7.324234704301861, 6.822226914595191, 7.792044674564248, 7.149607692275065, 7.078295043693808, 6.946740616609221, 6.700263270499871, 6.4699642011179925, 6.359739677958311, 6.494171402228005, 5.966063278273302, 6.15136761591695, 5.309723356734837, 5.00827796373236, 4.976659481606136, 4.042120043465434, 4.842002060938444, 5.114027203055052, 3.8900363946754233, 2.6866750639387074],
},
}
# Llama 3.1 8B, locally-deduplicated state: one line per year, plotting the
# per-year "perplexities" series against its "duplicates" series.
fig = go.Figure()
for dump_year, series in data.items():
    fig.add_trace(
        go.Scatter(
            x=series["duplicates"],
            y=series["perplexities"],
            mode='lines+markers',
            name=dump_year,
        )
    )
# update_layout returns the figure it was called on, so the labelled figure
# can be bound to its public name in the same statement.
llama_graph6 = fig.update_layout(
    title="Perplexity Across Different Dump Duplication Counts",
    xaxis_title="Number of Dumps Duplication",
    yaxis_title="Average Perplexity",
    legend_title="Year",
)
##txt360 vs fineweb comparison table
# Benchmark scores for the TxT360 (upsampled) vs. FineWeb ablation, one row per
# metric. Scores are kept as strings so they render exactly as written; a
# parenthesised difference means TxT360 scored lower than FineWeb.
dataset_comparison = pd.DataFrame(
    [
        ("BoolQ", "70.31", "71.5", "(1.19)"),
        ("PIQA", "80.36", "82.1", "(1.74)"),
        ("HellaSwag", "73.54", "79.46", "(5.92)"),
        ("Winogrande", "68.43", "70.96", "(2.53)"),
        ("MMLU", "30.26", "28.5", "1.76"),
        ("Natural Questions", "22.22", "19.03", "3.19"),
        ("TriviaQA", "58.52", "36.65", "21.87"),
        ("GSM8K", "3.41", "5.31", "(1.9)"),
        ("MATH", "28.04", "29.65", "(1.61)"),
        ("MedQA", "25.61", "27.26", "(1.65)"),
    ],
    columns=["Metric", "TxT360 - Upsampling", "FineWeb", "TxT360 Difference"],
)
def _shade_columns(styler, columns, css):
    """Apply one CSS declaration to every cell of ``columns`` and return the Styler.

    ``Styler.applymap`` is deprecated since pandas 2.1 in favour of
    ``Styler.map``; prefer the new name when the installed pandas offers it and
    fall back to the old one otherwise, so the page renders on either side of
    the rename without a deprecation warning.
    """
    cellwise = getattr(styler, "map", None) or styler.applymap
    return cellwise(lambda _: css, subset=pd.IndexSlice[:, columns])


# The two TxT360 columns get a green background, every remaining column is
# forced to white, and the numeric row index is hidden.
_txt360_columns = ["TxT360 - Upsampling", "TxT360 Difference"]
styled_table = _shade_columns(
    dataset_comparison.style,
    _txt360_columns,
    "background-color: #E1EEDB",
)
styled_table = _shade_columns(
    styled_table,
    dataset_comparison.columns.difference(_txt360_columns),
    "background-color: white",
)
styled_table = styled_table.hide(axis="index")

# The Styler's HTML is already markup, so it is wrapped in NotStr before being
# placed in a centred, horizontally scrollable container.
table_html = styled_table._repr_html_()
table_div_1 = Div(
    NotStr(table_html),
    style="display: flex; justify-content: center; align-items: center; width: 100%; max-width: 100%; height: auto; overflow-x: auto;",
)
# Opening block of the results page: two overview paragraphs followed by a
# bullet outline of the topics covered and the estimated reading time.
intro_div = Div(
    H2("TxT360 Studies"),
    H3("What This Section Contains"),
    P("This section shows the learning curve when pre-training on TxT360, with a proper upsampling approach. We compare several simple strategies and demonstrate that one particular upsampling method, inspired by the natural data distribution, performs exceptionally well. In our preliminary experiments, the model learns significantly faster on TxT360 compared to a similarly scaled dataset, FineWeb, on several important evaluation metrics. We believe that a more carefully designed upsampling strategy could further enhance the use of our data."),
    P("In addition to the training results, we also provide an analysis of the dataset, including perplexity trends over time across the CommonCrawl snapshots. This section is organized into the following topic areas:"),
    Ul(*(
        Li(entry, style="margin-bottom: 5px")
        for entry in (
            "The Learning Curve of TxT360 with an Upsampling Recipe",
            "Perplexity Analysis across time",
            "Topic Analysis on Data Cluster Groups",
            B("Estimated Reading Time: 25 minutes"),
        )
    )),
)
# Narrative for the upsampling ablation: motivation, experiment setup, the
# per-benchmark learning curves, and the training/validation loss curves.
# Reader-facing typos are corrected ("umsampling", "Furhter", "most all of",
# "Fineweb hypothesize"); all figures and numbers are unchanged.
upsampling_exp = Div(
    H2("A Simple Data Mix Creates a Good Learning Curve"),
    P(
        "As discussed in prior sections, duplicated documents can significantly reduce training efficiency (i.e., the ratio of model performance to the number of pre-trained tokens). Previous work, such as RefinedWeb",
        D_cite(bibtex_key="refinedweb"),
        ", emphasizes the importance of deduplication. Recently, the FineWeb study conducted an interesting analysis, comparing LLM performance when pre-trained on globally deduplicated versus locally deduplicated datasets. They found that training efficiency with a globally deduplicated dataset can be worse",
        D_cite(bibtex_key="fineweb"),
        ". FineWeb hypothesizes that global deduplication may remove a higher proportion of high-quality documents."
    ),
    P(
        "This finding led us to consider that a pre-training corpus based on crawled websites is naturally upsampled for a variety of reasons. For example, commonly used templates or boilerplates may appear millions of times; a well-regarded article reposted by different users may surface across multiple sites; and the same web pages, crawled by CommonCrawl at different times, will duplicate each other. The reasons behind these duplications vary: some may serve as indirect indicators of high-quality content, while others may not. Therefore, curating a pre-training dataset should involve leveraging these signals and considering data weighting schemes — or at the very least, provide users with the necessary information to control it effectively."
    ),
    P(
        "To this end, we store rich metadata for each document source, including features like user votes from StackExchange. One crucial piece of metadata is the number of duplicates detected for a document. This information allows users to reconstruct the natural web distribution, but more importantly, we will demonstrate that a simple upsampling recipe based on this metadata can create a high-quality data mix."
    ),
    H3("Experiment Setup"),
    # NOTE(review): the ranges "2 to 5" and "5 to 100" below overlap at 5;
    # confirm the intended bucket boundary before changing the text.
    P(
        "Motivated by the FineWeb study, we opted to upsample documents based on their natural distribution. However, since duplication is only an indirect indicator of quality, we upsample documents to a few predefined levels rather than using their exact count. Specifically, we set the upsampling weight to 3 for documents with 2 to 5 duplicates, 5 for those with 5 to 100 duplicates, 8 for 101 to 1000 duplicates, and 10 for documents with over 1000 duplicates. These values were selected heuristically and informed by preliminary small-scale experiments. For non-CommonCrawl data sources, we assign a weight of 2 if the document appears more than once. This straightforward approach results in a corpus exceeding 15 trillion tokens, making it one of the largest open-access pre-training datasets available."
    ),
    P(
        "To evaluate the training efficiency of our dataset, we sampled 1.5T tokens from both FineWeb and TxT360 (using the aforementioned weighting) and conducted a training ablation on an 8x8B Mixture-of-Experts architecture, similar to Mixtral. We compared the learning curves by tracking training loss, validation scores, and performance across a wide array of diverse evaluation benchmarks. The validation set was sampled independently from SlimPajama",
        D_cite(bibtex_key="cerebras2023slimpajama"),
        ". Note that this experiment is done on a slightly earlier version of the dataset."
    ),
    H3("Learning Curves on the Evaluation Metrics"),
    P(
        "Evaluation results are the most direct indicator of model quality. We assess the intermediate results of the models across multiple metrics and plot the learning curves. Our findings indicate that the model learns significantly faster with TxT360. For a fair comparison, we evaluate TxT360 against FineWeb using only the CommonCrawl data sources, and we also show the curves after incorporating the 14 curated sources and coding data (Stack V2), demonstrating the full potential of the dataset. Due to computation resource constraints, we stop running experiments when we can observe clear trends."
    ),
    P(
        "Based on the metrics, we find that TxT360’s CommonCrawl portion with the upsampling strategy outperforms FineWeb on key metrics such as MMLU and NQ, but falls slightly behind on HellaSwag. Further, we show that by combining TxT360 with coding data (Stack V2), the learning curve is significantly more stable and we observe improved results across almost all of the metrics. Apparently the dataset preference here may depend on the set of metrics one would use."
    ),
    plotly2fasthtml(all_eval_res_figs["MMLU"]),
    plotly2fasthtml(all_eval_res_figs["NQ"]),
    plotly2fasthtml(all_eval_res_figs["HellaSwag"]),
    P(
        "Similar to the findings in DCLM, adding the curated non-CommonCrawl data sources produces mixed results (some preliminary figures are not shown here). Yet such data can help with domain specific tasks like MedQA."
    ),
    plotly2fasthtml(all_eval_res_figs["MedQA"]),
    plotly2fasthtml(all_eval_res_figs["PIQA"]),
    plotly2fasthtml(all_eval_res_figs["TriviaQA"]),
    plotly2fasthtml(all_eval_res_figs["WinoGrande"]),
    H3("Comparing the Loss Curves"),
    P(
        "We also plot the training and validation loss curves for each dataset, showing that TxT360 achieves both lower training and validation losses compared to FineWeb. Although training loss may not correlate directly with final model performance, we observe that the loss curve for TxT360 exhibits fewer spikes compared to FineWeb, indicating more stable training dynamics."
    ),
    plotly2fasthtml(lm_loss_graph),
    plotly2fasthtml(validation_loss_graph),
)
# Introduction to the perplexity study: which scoring model is used and how the
# documents were sampled. The variable name keeps its historical spelling
# because results() refers to it by that name.
# Fixes: the KenLM model link pointed at "huggingface.co./" (stray dot before
# the path), plus the typos "coorelate" and "a early".
preplexity_intro_div = Div(
    H2("Perplexity Evaluation on Duplicate Data"),
    H3("Model based Quality Estimation"),
    P(
        "We took one of the model-based data quality evaluation strategies adopted by ",
        A("DataComp-LM", href="https://arxiv.org/abs/2406.11794"),
        " which used perplexity filtering as a candidate for quality filtering. The DCLM results show that a simple perplexity filter is still quite strong. DCLM followed ",
        A("CCNet’s", href="https://arxiv.org/abs/1911.00359"),
        " practice to use a 5-gram Kneser-Ney model as implemented in the ",
        A("KenLM", href="https://github.com/kpu/kenlm"),
        " library for efficient perplexity calculation. In order to gain more insights of our dataset, we also took a ",
        A("KenLM model", href="https://huggingface.co/edugp/kenlm"),
        " trained on English Wikipedia data to compute perplexity on data with different duplication patterns, and try to observe how such signals correlate with the duplication patterns.",
    ),
    H3("Sampling Strategy"),
    P("We took an early version of the TxT360 Common Crawl (CC) portion, and bucket the documents by the number of duplicates each has. For each CC snapshot, we bucket the documents by their duplicate counts in the following buckets (1, 2-5, 6-10, 11-100, 101-1000, 1001-infinite). We sampled the first 10k documents from each bucket."),
)
# KenLM perplexity figures, each with a short reading guide. The first three
# sections use the globally deduplicated data; the last two repeat the analysis
# on the reconstructed locally-deduplicated state.
# Reader-facing typos are corrected ("turn of", "deduplicted", "This trends
# are", "a document appear", "seem", "keep copy"); figures are unchanged.
perp1_div = Div(
    # Disabled for now: this looks basically the same as the per-year figure below.
    # Section(
    #     H3("Perplexity vs Buckets"),
    #     P("For each bucket, we aggregated all the chunks that belong to a single year and calculated the average perplexity for each (bucket, year) data point. We observe the perplexity is generally dropping. This could be biased since we always keep the newest document if we find a duplicate."),
    #     plotly2fasthtml(Perplexity_Across_Different_Buckets_global_graph),
    # ),
    Section(
        H3("Perplexity vs. Years"),
        P("Taking the same data, we can convert it into a graph indicating the yearly trend. For most buckets, the average perplexity of dumps from more recent years seems to be lower than that of former years. This could be biased since we always keep the newest document if we find a duplicate."),
        plotly2fasthtml(graph2222),
    ),
    Section(
        H3("Perplexity vs. Document Duplication"),
        P("Instead of bucketing, we also plot the relationship between perplexity versus the number of duplicates directly. The graph becomes a bit noisy at the end because of insufficient samples with larger duplication counts. However, we can observe that there seems to be a lower point at around 10-20 duplicates. To see the results more clearly, we recommend you turn off other years and only look at one year, and zoom in to 0-100 region on the X axis."),
        plotly2fasthtml(graph3),
    ),
    Section(
        H3("Perplexity vs. Dump Duplication"),
        P("FineWeb hypothesizes that documents appearing across multiple snapshots (CC dumps) might be an indicator of quality. Hence, we also plot the perplexity versus the number of times a document appears in different snapshots. From the graph below we can see that documents that are duplicated across around 40 - 60 snapshots usually have lower perplexity."),
        plotly2fasthtml(graph4),
    ),
    Section(
        H3("Perplexity Plots before Global Deduplication"),
        P("Previously we have seen that documents in recent snapshots tend to have lower perplexity. This might be related to the way global deduplication was implemented. During global deduplication, we only keep the copy in the latest dump. Hence documents that are duplicated across multiple dumps only appear in the latest one. To avoid bias brought by this strategy, we tried to recover the states before the global deduplication using the stored metadata (i.e., the locally deduplicated dataset state). The trends are a bit different. In the figure below, we do not observe a clear trend of which year has a higher quality, especially in the 2-10 bucket region."),
        plotly2fasthtml(graph5),
    ),
    Section(
        H3("Perplexity vs. Dump Duplication before Global Deduplication"),
        P("Following the same practice, we can plot the graph of average perplexity with respect to dump duplication count, before global deduplication. The conclusion is similar, that documents with a dump duplication count around 40-60 have the lower perplexity."),
        plotly2fasthtml(graph6),
    ),
)
# Llama 3.1 8B repeat of the perplexity study: an intro section followed by one
# heading + figure section per plot, generated from (heading, figure) pairs.
llama_div = Div(
    Section(
        H2("Llama 3.1 8B"),
        P("For comparison purpose, we run the same perplexity evaluation with llama 3.1 8B model."),
    ),
    *(
        Section(H3(heading), plotly2fasthtml(figure))
        for heading, figure in (
            ("Perplexity vs. Buckets", llama_graph1),
            ("Perplexity vs. Years", llama_graph2),
            ("Perplexity vs. Dump Duplication", llama_graph4),
            ("Perplexity vs. Buckets before Global Deduplication", llama_graph5),
            ("Perplexity vs. Dump Duplication Count before Global Deduplication", llama_graph6),
        )
    ),
)
def _rgb_strings(colors):
    """Format each colour triple as an ``rgb(r, g, b)`` string for Plotly.

    Every channel is multiplied by 255 before formatting — presumably the JSON
    stores 0-1 floats; confirm against the exporter that writes the file.
    """
    return [
        "rgb(" + ", ".join(str(val * 255) for val in rgb) + ')'
        for rgb in colors
    ]


def _topic_figure(title, chart):
    """Build the Plotly figure for one ``(title, chart)`` entry of topic_charts.

    Raises:
        ValueError: if ``chart["type"]`` is neither ``"barh"`` nor ``"pie"``.
            Skipping such an entry would leave topic_graphs shorter than
            topic_charts, and the page indexes both lists by the same position.
    """
    chart_type = chart["type"]
    if chart_type == "barh":
        kwargs = chart["kwargs"]
        return go.Figure(go.Bar(
            x=kwargs["width"],
            y=kwargs['y'],
            orientation='h',
            marker_color=_rgb_strings(kwargs["color"]),
        ))
    if chart_type == "pie":
        kwargs = chart["kwargs"]
        return go.Figure(go.Pie(
            values=kwargs['x'],
            labels=kwargs["labels"],
            marker_colors=_rgb_strings(kwargs["colors"]),
        ))
    raise ValueError(f"Unsupported chart type {chart_type!r} for topic chart {title!r}")


# The chart specs sit next to this module in data/topic_charts.json; JSON text
# is UTF-8, so the encoding is pinned rather than left to the platform default.
with open(os.path.join(os.path.dirname(__file__), "data", "topic_charts.json"), 'r', encoding="utf-8") as f:
    topic_charts = json.load(f)

# One figure per chart spec, in file order. The comprehension keeps its loop
# variables local, so the module-level `data` name is not rebound here.
topic_graphs = [_topic_figure(title, chart) for title, chart in topic_charts]
# Topic-analysis section: methodology, the list of 17 topic clusters, and one
# sub-section per entry of topic_charts (title, figure, optional comment).
# Reader-facing typos are corrected ("metadta", "by first clustered",
# "composition of dataset").
cluster_div = Div(
    Section(
        H2("Topic Analysis"),
        P("In order to understand our dataset better, we tried to cluster our data into topic groups and examined for correlations between topics and other attributes of the documents. We suspect documents from different topic groups should manifest different characteristics of distribution, which can give us some insight into the composition of the dataset."),
        H3("Methodology"),
        P("We took an early version of the LLM360 Common Crawl portion and clustered them into 17 topic groups using ", A("BERTopic", href="https://maartengr.github.io/BERTopic/index.html"), ". We collected and aggregated a series of metrics from the stored metadata. For each topic group, we calculated average scores and generated the corresponding bar charts over different metrics for comparison and analysis."),
        H3("Cluster Groups"),
        # NOTE(review): "128 dumps" below may have been meant as "128 clusters";
        # left as written — confirm with the authors.
        P("We grouped data into the following 17 clusters. These clusters are obtained by first clustering a seed portion of the dataset into 128 dumps, and then we manually inspect the clusters to combine 17 semantically meaningful ones."),
        Ul(*(
            Li(topic_name, style="margin-bottom: 5px")
            for topic_name in (
                "Arts",
                "Business & Economics & Finance",
                "Culture & Cultural geography",
                "Daily Life & Home & Lifestyle",
                "Education",
                "Entertainment & Travel & Hobby",
                "Environment",
                "Food & Drink & Cooking",
                "Health & Wellness & Medicine",
                "Law & Justice",
                "Natural Science & Formal Science & Technology",
                "Personal Development & Human Resources & Career",
                "Politics & Government",
                "Religion & Spirituality",
                "Shopping & Commodity",
                "Society & Social Issues & Human Rights",
                "Sports",
            )
        )),
        H3("Topic vs. Various Metrics"),
        P(
            "In the following section, we plot the cluster against their average score of a particular metric stored in the metadata. We recommend the readers to jump to the ones you are most interested in."
        ),
        # topic_graphs is indexed by position, so it must line up with topic_charts.
        *(
            Section(H4(chart_title), plotly2fasthtml(topic_graphs[i]), P(chart.get("comment", '')))
            for i, (chart_title, chart) in enumerate(topic_charts)
        )
    )
)
def results():
    """Assemble the results page from the module-level content blocks.

    Each block is wrapped in its own Section inside a Div with id
    "inner-text". Sections carry ids "section51" to "section55"; the Llama
    comparison section is emitted without an id.
    """
    page_sections = [
        Section(intro_div, id="section51"),
        Section(upsampling_exp, id="section52"),
        Section(preplexity_intro_div, id="section53"),
        Section(perp1_div, id="section54"),
        Section(llama_div),
        Section(cluster_div, id="section55"),
    ]
    return Div(*page_sections, id="inner-text")