Add files via upload

This commit is contained in:
alainnothere 2026-03-19 02:02:55 +00:00 committed by GitHub
parent add2765a15
commit a3d2a715fe
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -0,0 +1,43 @@
{"is_baseline": true, "dup_start": -1, "dup_end": -1, "math_score": 0.7405238987432614, "eq_score": 94.4921875, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:01:19.488780"}
{"dup_start": 6, "dup_end": 9, "n_dup_layers": 3, "math_score": 0.7805742475441455, "eq_score": 95.703125, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:03:46.745090"}
{"dup_start": 9, "dup_end": 12, "n_dup_layers": 3, "math_score": 0.7247009876556773, "eq_score": 95.0390625, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:06:20.446245"}
{"dup_start": 12, "dup_end": 15, "n_dup_layers": 3, "math_score": 0.7257775592300113, "eq_score": 94.140625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:08:36.019052"}
{"dup_start": 15, "dup_end": 18, "n_dup_layers": 3, "math_score": 0.749302485585077, "eq_score": 95.7421875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:11:00.943316"}
{"dup_start": 18, "dup_end": 21, "n_dup_layers": 3, "math_score": 0.7204157812814636, "eq_score": 93.3984375, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:13:30.623844"}
{"dup_start": 21, "dup_end": 24, "n_dup_layers": 3, "math_score": 0.7106833702644649, "eq_score": 92.96875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:15:57.703249"}
{"dup_start": 24, "dup_end": 27, "n_dup_layers": 3, "math_score": 0.6487107864763348, "eq_score": 95.2734375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:18:23.670215"}
{"dup_start": 27, "dup_end": 30, "n_dup_layers": 3, "math_score": 0.7180102727314654, "eq_score": 94.6484375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:20:59.948323"}
{"dup_start": 30, "dup_end": 33, "n_dup_layers": 3, "math_score": 0.7138929582916131, "eq_score": 94.0234375, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:23:37.352238"}
{"dup_start": 33, "dup_end": 36, "n_dup_layers": 3, "math_score": 0.710407524578248, "eq_score": 94.53125, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:26:03.759148"}
{"dup_start": 36, "dup_end": 39, "n_dup_layers": 3, "math_score": 0.7017281399684466, "eq_score": 94.6875, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:28:23.001252"}
{"dup_start": 6, "dup_end": 10, "n_dup_layers": 4, "math_score": 0.8125148152897631, "eq_score": 96.3671875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:30:48.154933"}
{"dup_start": 9, "dup_end": 13, "n_dup_layers": 4, "math_score": 0.7598022807991355, "eq_score": 95.078125, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:33:11.743074"}
{"dup_start": 12, "dup_end": 16, "n_dup_layers": 4, "math_score": 0.7481617437152214, "eq_score": 93.7109375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:35:35.080032"}
{"dup_start": 15, "dup_end": 19, "n_dup_layers": 4, "math_score": 0.7617270013353001, "eq_score": 95.15625, "reasoning_score": 0.8235294117647058, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:38:05.893256"}
{"dup_start": 18, "dup_end": 22, "n_dup_layers": 4, "math_score": 0.6901500062751371, "eq_score": 92.265625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:40:47.490837"}
{"dup_start": 21, "dup_end": 25, "n_dup_layers": 4, "math_score": 0.7287948603204509, "eq_score": 94.1015625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:43:20.148715"}
{"dup_start": 24, "dup_end": 28, "n_dup_layers": 4, "math_score": 0.6822609151021245, "eq_score": 94.5703125, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:45:54.358123"}
{"dup_start": 27, "dup_end": 31, "n_dup_layers": 4, "math_score": 0.7224157574849671, "eq_score": 94.4140625, "reasoning_score": 0.8235294117647058, "reasoning_cats": {"causal": 0.3333333333333333, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:48:32.113005"}
{"dup_start": 30, "dup_end": 34, "n_dup_layers": 4, "math_score": 0.7070250448292428, "eq_score": 94.7265625, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:51:05.446835"}
{"dup_start": 33, "dup_end": 37, "n_dup_layers": 4, "math_score": 0.7008919981941004, "eq_score": 94.375, "reasoning_score": 1.0, "reasoning_cats": {"causal": 1.0, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:53:30.446053"}
{"dup_start": 36, "dup_end": 40, "n_dup_layers": 4, "math_score": 0.7057003835259786, "eq_score": 94.84375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:56:04.479511"}
{"dup_start": 6, "dup_end": 11, "n_dup_layers": 5, "math_score": 0.8167558856236048, "eq_score": 95.625, "reasoning_score": 1.0, "reasoning_cats": {"causal": 1.0, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T19:58:37.162840"}
{"dup_start": 9, "dup_end": 14, "n_dup_layers": 5, "math_score": 0.7245442180746329, "eq_score": 95.234375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:01:05.963620"}
{"dup_start": 12, "dup_end": 17, "n_dup_layers": 5, "math_score": 0.7824924859565509, "eq_score": 94.8828125, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:03:35.346446"}
{"dup_start": 15, "dup_end": 20, "n_dup_layers": 5, "math_score": 0.7832091102149359, "eq_score": 95.859375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:06:08.259020"}
{"dup_start": 18, "dup_end": 23, "n_dup_layers": 5, "math_score": 0.720791473973756, "eq_score": 92.421875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:08:47.317575"}
{"dup_start": 21, "dup_end": 26, "n_dup_layers": 5, "math_score": 0.7055170260892233, "eq_score": 92.890625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:11:24.049734"}
{"dup_start": 24, "dup_end": 29, "n_dup_layers": 5, "math_score": 0.5825061294932379, "eq_score": 95.0390625, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:13:59.489114"}
{"dup_start": 27, "dup_end": 32, "n_dup_layers": 5, "math_score": 0.7088027122970938, "eq_score": 94.1796875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:16:37.450324"}
{"dup_start": 30, "dup_end": 35, "n_dup_layers": 5, "math_score": 0.6787145825703289, "eq_score": 94.6875, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:19:16.869381"}
{"dup_start": 33, "dup_end": 38, "n_dup_layers": 5, "math_score": 0.665015604932646, "eq_score": 94.9609375, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:21:44.688514"}
{"dup_start": 6, "dup_end": 12, "n_dup_layers": 6, "math_score": 0.7691836044599836, "eq_score": 95.390625, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:24:20.779131"}
{"dup_start": 9, "dup_end": 15, "n_dup_layers": 6, "math_score": 0.7404999519432109, "eq_score": 94.6484375, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:26:44.297999"}
{"dup_start": 12, "dup_end": 18, "n_dup_layers": 6, "math_score": 0.7581846120997626, "eq_score": 94.5703125, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:29:08.091870"}
{"dup_start": 15, "dup_end": 21, "n_dup_layers": 6, "math_score": 0.7828286920833635, "eq_score": 93.515625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:31:42.341391"}
{"dup_start": 18, "dup_end": 24, "n_dup_layers": 6, "math_score": 0.7307900469550004, "eq_score": 92.9296875, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 0.6666666666666666, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:34:26.215950"}
{"dup_start": 21, "dup_end": 27, "n_dup_layers": 6, "math_score": 0.6790520279170066, "eq_score": 92.5390625, "reasoning_score": 0.8235294117647058, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 0.6666666666666666, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:37:10.344673"}
{"dup_start": 24, "dup_end": 30, "n_dup_layers": 6, "math_score": 0.6767867848715058, "eq_score": 95.15625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.6666666666666666, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:40:01.499627"}
{"dup_start": 27, "dup_end": 33, "n_dup_layers": 6, "math_score": 0.7743560625589063, "eq_score": 94.5703125, "reasoning_score": 0.9411764705882353, "reasoning_cats": {"causal": 1.0, "date": 0.6666666666666666, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:42:40.628671"}
{"dup_start": 30, "dup_end": 36, "n_dup_layers": 6, "math_score": 0.7414868249649326, "eq_score": 94.4140625, "reasoning_score": 0.8823529411764706, "reasoning_cats": {"causal": 0.3333333333333333, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:45:14.335813"}
{"dup_start": 33, "dup_end": 39, "n_dup_layers": 6, "math_score": 0.7346941242074608, "eq_score": 94.7265625, "reasoning_score": 1.0, "reasoning_cats": {"causal": 1.0, "date": 1.0, "logic": 1.0, "nav": 1.0, "gsm": 1.0}, "timestamp": "2026-03-18T20:47:54.004093"}