File size: 5,109 Bytes
d544291
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
,version,d_sae,layer,kl_div_with_sae,kl_div_with_ablation,ce_loss_with_sae,ce_loss_without_sae,ce_loss_with_ablation,kl_div_score,ce_loss_score,l2_norm_in,l2_norm_out,l2_ratio,l0,l1,explained_variance,mse,total_tokens_evaluated,filepath
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_0/metrics.json,5,128,0,0.0028826396446675062,3.094083309173584,3.6018943786621094,3.599064588546753,6.694648742675781,0.999068338064421,0.9990858623204987,29.933448791503906,29.71919822692871,0.9930059909820557,31.99934959411621,61.198638916015625,0.9775193929672241,13.276110649108887,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_0/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_1/metrics.json,5,128,1,0.004241525661200285,0.05105271190404892,3.599820852279663,3.599064588546753,3.6525371074676514,0.9169187002411934,0.9858569645086499,18.973735809326172,18.205364227294922,0.9327648878097534,32.0,84.0601806640625,0.9169172048568726,17.682374954223633,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_1/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_2/metrics.json,5,128,2,0.006751821842044592,0.05874736234545708,3.602034091949463,3.599064588546753,3.6459126472473145,0.8850702129852012,0.9366141632102598,49.106536865234375,47.9766845703125,0.912467360496521,31.984375,82.67613983154297,0.981090247631073,28.213790893554688,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_2/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_3/metrics.json,5,128,3,0.008531898260116577,0.07059153914451599,3.6077229976654053,3.599064588546753,3.658677577972412,0.8791370982484182,0.8547563341132242,16.98731803894043,15.537837028503418,0.8995180130004883,31.90511131286621,81.88644409179688,0.8274940252304077,38.814979553222656,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_3/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_4/metrics.json,5,128,4,0.010455957613885403,0.06332532316446304,3.6118924617767334,3.599064588546753,3.6600804328918457,0.8348850492759414,0.7897616042575971,17.251985549926758,15.434064865112305,0.8794459700584412,31.984375,78.37165832519531,0.780777633190155,50.81820297241211,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_4/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_5/metrics.json,5,128,5,0.011617729440331459,0.06850520521402359,3.6092593669891357,3.599064588546753,3.6693859100341797,0.8304109971784566,0.8550257841186103,18.888967514038086,16.669851303100586,0.8737667798995972,31.98372459411621,77.13916015625,0.7653716802597046,71.50291442871094,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_5/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_6/metrics.json,5,128,6,0.014023388735949993,0.07569437474012375,3.6142406463623047,3.599064588546753,3.67651629447937,0.814736712152052,0.8040577979166154,21.466564178466797,18.890602111816406,0.8757946491241455,31.99837303161621,74.61764526367188,0.754051685333252,97.22125244140625,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_6/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_7/metrics.json,5,128,7,0.014005273580551147,0.08048636466264725,3.6098315715789795,3.599064588546753,3.6727118492126465,0.8259919721899077,0.8538033467249813,25.444438934326172,22.559194564819336,0.8843803405761719,31.99788475036621,72.55130004882812,0.7648060321807861,130.78082275390625,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_7/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_8/metrics.json,5,128,8,0.0149507075548172,0.08732372522354126,3.6158981323242188,3.599064588546753,3.6803367137908936,0.828789856175459,0.7928743252757569,30.250225067138672,26.934555053710938,0.8884322047233582,31.99690818786621,72.55912780761719,0.7680301070213318,183.63497924804688,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_8/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_9/metrics.json,5,128,9,0.01591905765235424,0.09758877754211426,3.615844488143921,3.599064588546753,3.6962451934814453,0.8368761444369522,0.827332834484366,40.192413330078125,36.57688903808594,0.9057919383049011,32.0,68.9762954711914,0.7820959091186523,267.2160949707031,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_9/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_10/metrics.json,5,128,10,0.019077030941843987,0.12674781680107117,3.616905927658081,3.599064588546753,3.708984136581421,0.8494882876619082,0.8376872955691096,81.75682830810547,78.83488464355469,0.9609333872795105,32.0,48.323631286621094,0.819786787033081,443.10888671875,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_10/metrics.json
OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_11/metrics.json,5,128,11,0.024071572348475456,0.17384076118469238,3.620229721069336,3.599064588546753,3.783318281173706,0.8615309080308198,0.8851304838409143,92.90629577636719,88.29003143310547,0.9321191310882568,32.0,71.25521850585938,0.8613338470458984,635.45947265625,6144.0,OAI_GPT2Small_v5_128k_resid_delta_mlp/v5_128k_layer_11/metrics.json