From 1a3c4faf4e0a25ed0b86e8739d5319a634cb9112 Mon Sep 17 00:00:00 2001 From: Christian Krinitsin Date: Tue, 8 Jul 2025 08:55:39 +0000 Subject: add deepseek 70b result --- .../no-thinking-deepseek-r1:70b/categories.csv | 5 + .../output/instruction/1028 | 37 + .../output/instruction/1051 | 4 + .../output/instruction/1079080 | 13 + .../output/instruction/1086 | 72 ++ .../output/instruction/1092 | 17 + .../output/instruction/1095531 | 60 + .../output/instruction/1095857 | 14 + .../output/instruction/1128 | 27 + .../output/instruction/1129571 | 17 + .../output/instruction/1156 | 4 + .../output/instruction/1156313 | 129 ++ .../output/instruction/1178 | 4 + .../output/instruction/122 | 4 + .../output/instruction/1221966 | 37 + .../output/instruction/1233225 | 27 + .../output/instruction/1245543 | 26 + .../output/instruction/1246990 | 41 + .../output/instruction/1248 | 14 + .../output/instruction/1251 | 18 + .../output/instruction/1254786 | 45 + .../output/instruction/1267 | 96 ++ .../output/instruction/1267955 | 45 + .../output/instruction/1283519 | 13 + .../output/instruction/1308381 | 17 + .../output/instruction/1328996 | 6 + .../output/instruction/1339 | 19 + .../output/instruction/1361912 | 12 + .../output/instruction/1368 | 41 + .../output/instruction/1370 | 16 + .../output/instruction/1371 | 22 + .../output/instruction/1372 | 23 + .../output/instruction/1373 | 23 + .../output/instruction/1374 | 25 + .../output/instruction/1375 | 22 + .../output/instruction/1376 | 18 + .../output/instruction/1377 | 16 + .../output/instruction/1404690 | 41 + .../output/instruction/1412 | 8 + .../output/instruction/1428352 | 47 + .../output/instruction/1441 | 37 + .../output/instruction/1469342 | 6 + .../output/instruction/1471 | 19 + .../output/instruction/1494 | 935 ++++++++++++++ .../output/instruction/1536 | 19 + .../output/instruction/1541 | 35 + .../output/instruction/1553 | 15 + .../output/instruction/1574346 | 15 + .../output/instruction/1590336 | 18 + 
.../output/instruction/1594069 | 11 + .../output/instruction/1605123 | 31 + .../output/instruction/1606 | 32 + .../output/instruction/1611394 | 32 + .../output/instruction/1612 | 54 + .../output/instruction/1613817 | 59 + .../output/instruction/1620 | 97 ++ .../output/instruction/1637 | 4 + .../output/instruction/1641637 | 716 +++++++++++ .../output/instruction/1642 | 25 + .../output/instruction/1701821 | 217 ++++ .../output/instruction/1713066 | 22 + .../output/instruction/1722 | 90 ++ .../output/instruction/1725267 | 34 + .../output/instruction/1727737 | 28 + .../output/instruction/1737 | 52 + .../output/instruction/1738434 | 31 + .../output/instruction/1748296 | 28 + .../output/instruction/1751422 | 7 + .../output/instruction/1751494 | 39 + .../output/instruction/1756927 | 21 + .../output/instruction/1761401 | 13 + .../output/instruction/1771 | 36 + .../output/instruction/1779 | 33 + .../output/instruction/1779634 | 38 + .../output/instruction/1780 | 20 + .../output/instruction/1781281 | 31 + .../output/instruction/1785734 | 78 ++ .../output/instruction/1790 | 32 + .../output/instruction/1793119 | 32 + .../output/instruction/1793608 | 19 + .../output/instruction/1796520 | 39 + .../output/instruction/1806243 | 87 ++ .../output/instruction/1812451 | 17 + .../output/instruction/1812861 | 25 + .../output/instruction/1815024 | 18 + .../output/instruction/1818075 | 56 + .../output/instruction/1820686 | 8 + .../output/instruction/1821430 | 35 + .../output/instruction/1821444 | 32 + .../output/instruction/1821515 | 41 + .../output/instruction/1824778 | 10 + .../output/instruction/1826568 | 16 + .../output/instruction/1828867 | 11 + .../output/instruction/1832422 | 12 + .../output/instruction/1841990 | 41 + .../output/instruction/1847467 | 19 + .../output/instruction/1858415 | 27 + .../output/instruction/1859713 | 28 + .../output/instruction/1860056 | 23 + .../output/instruction/1861404 | 53 + .../output/instruction/1863247 | 11 + .../output/instruction/1873898 | 41 + 
.../output/instruction/1874888 | 46 + .../output/instruction/1877794 | 6 + .../output/instruction/1883784 | 12 + .../output/instruction/1885350 | 26 + .../output/instruction/1889288 | 10 + .../output/instruction/1892081 | 17 + .../output/instruction/1895471 | 26 + .../output/instruction/1901 | 22 + .../output/instruction/1904210 | 54 + .../output/instruction/1905356 | 15 + .../output/instruction/1907969 | 61 + .../output/instruction/1908 | 52 + .../output/instruction/1909 | 53 + .../output/instruction/1912934 | 20 + .../output/instruction/1914021 | 30 + .../output/instruction/1916269 | 22 + .../output/instruction/1918026 | 32 + .../output/instruction/1922887 | 33 + .../output/instruction/1925512 | 21 + .../output/instruction/1926759 | 21 + .../output/instruction/1927530 | 42 + .../output/instruction/1941 | 105 ++ .../output/instruction/1955 | 40 + .../output/instruction/2078 | 37 + .../output/instruction/2083 | 114 ++ .../output/instruction/2089 | 30 + .../output/instruction/2122 | 10 + .../output/instruction/2136 | 38 + .../output/instruction/2175 | 41 + .../output/instruction/2203 | 4 + .../output/instruction/2248 | 39 + .../output/instruction/2302 | 28 + .../output/instruction/2317 | 41 + .../output/instruction/2318 | 37 + .../output/instruction/2319 | 20 + .../output/instruction/2336 | 26 + .../output/instruction/2371 | 55 + .../output/instruction/2372 | 112 ++ .../output/instruction/2373 | 98 ++ .../output/instruction/2375 | 88 ++ .../output/instruction/2376 | 117 ++ .../output/instruction/2386 | 46 + .../output/instruction/2419 | 21 + .../output/instruction/2422 | 72 ++ .../output/instruction/2474 | 99 ++ .../output/instruction/2483 | 23 + .../output/instruction/2487 | 71 + .../output/instruction/2497 | 6 + .../output/instruction/2498 | 54 + .../output/instruction/2499 | 33 + .../output/instruction/2500 | 7 + .../output/instruction/2536 | 4 + .../output/instruction/2595 | 138 ++ .../output/instruction/2632 | 86 ++ .../output/instruction/2647 | 50 + 
.../output/instruction/266 | 4 + .../output/instruction/2672 | 23 + .../output/instruction/2696 | 15 + .../output/instruction/2730 | 13 + .../output/instruction/2802 | 29 + .../output/instruction/2865 | 55 + .../output/instruction/2878 | 4 + .../output/instruction/2971 | 47 + .../output/instruction/312 | 4 + .../output/instruction/333 | 4 + .../output/instruction/361 | 4 + .../output/instruction/364 | 4 + .../output/instruction/381 | 4 + .../output/instruction/390 | 4 + .../output/instruction/422 | 4 + .../output/instruction/427 | 4 + .../output/instruction/449 | 71 + .../output/instruction/494 | 4 + .../output/instruction/508 | 4 + .../output/instruction/514 | 28 + .../output/instruction/616 | 110 ++ .../output/instruction/618 | 98 ++ .../output/instruction/625 | 26 + .../output/instruction/754 | 210 +++ .../output/instruction/799 | 50 + .../output/instruction/824 | 15 + .../output/instruction/826 | 19 + .../output/instruction/837 | 33 + .../output/instruction/890 | 4 + .../output/instruction/904308 | 101 ++ .../output/instruction/947 | 16 + .../output/instruction/952 | 100 ++ .../output/instruction/984 | 26 + .../output/instruction/993 | 84 ++ .../output/instruction/998 | 63 + .../output/manual-review/1022 | 36 + .../output/manual-review/1550503 | 16 + .../output/manual-review/1593 | 10 + .../output/manual-review/1617929 | 53 + .../output/manual-review/1738545 | 34 + .../output/manual-review/1805913 | 24 + .../output/manual-review/1824344 | 48 + .../output/manual-review/1830 | 29 + .../output/manual-review/1833 | 87 ++ .../output/manual-review/1854738 | 31 + .../output/manual-review/1858461 | 26 + .../output/manual-review/1869782 | 16 + .../output/manual-review/1895 | 149 +++ .../output/manual-review/1898954 | 29 + .../output/manual-review/1906193 | 60 + .../output/manual-review/1908626 | 68 + .../output/manual-review/1910 | 65 + .../output/manual-review/1915327 | 37 + .../output/manual-review/1967248 | 41 + .../output/manual-review/2374 | 114 ++ 
.../output/manual-review/2448 | 49 + .../output/manual-review/2495 | 75 ++ .../output/manual-review/2553 | 85 ++ .../output/manual-review/2560 | 108 ++ .../output/manual-review/306 | 4 + .../output/manual-review/739785 | 37 + .../output/manual-review/829 | 17 + .../output/runtime/1010484 | 9 + .../output/runtime/1027 | 18 + .../output/runtime/1034 | 20 + .../output/runtime/1041 | 34 + .../output/runtime/1044 | 4 + .../output/runtime/1052857 | 18 + .../output/runtime/1054812 | 8 + .../output/runtime/1059 | 13 + .../output/runtime/1068900 | 8 + .../output/runtime/1070 | 13 + .../output/runtime/1075 | 19 + .../output/runtime/1093 | 36 + .../output/runtime/1098729 | 46 + .../output/runtime/1102 | 41 + .../output/runtime/1143 | 81 ++ .../output/runtime/1147 | 12 + .../output/runtime/1165383 | 6 + .../output/runtime/1172613 | 66 + .../output/runtime/1182490 | 79 ++ .../output/runtime/1187319 | 11 + .../output/runtime/1207896 | 6 + .../output/runtime/1209 | 8 + .../no-thinking-deepseek-r1:70b/output/runtime/121 | 4 + .../output/runtime/1211 | 10 + .../output/runtime/1228 | 46 + .../output/runtime/1245703 | 12 + .../output/runtime/1248168 | 27 + .../output/runtime/1254828 | 40 + .../output/runtime/1255 | 14 + .../output/runtime/1261743 | 8 + .../output/runtime/1285363 | 48 + .../output/runtime/1287195 | 6 + .../output/runtime/1294898 | 81 ++ .../output/runtime/1311614 | 50 + .../output/runtime/1319100 | 72 ++ .../output/runtime/1346784 | 70 + .../output/runtime/1357206 | 62 + .../output/runtime/1357226 | 14 + .../output/runtime/1362635 | 45 + .../output/runtime/1388 | 17 + .../output/runtime/1429313 | 12 + .../output/runtime/1435 | 19 + .../output/runtime/1478 | 69 + .../output/runtime/1495 | 9 + .../output/runtime/1512 | 4 + .../output/runtime/1519037 | 10 + .../output/runtime/1527765 | 75 ++ .../output/runtime/1528 | 12 + .../output/runtime/1528239 | 48 + .../output/runtime/1531 | 18 + .../output/runtime/1533141 | 18 + .../output/runtime/1547 | 15 + 
.../output/runtime/1568107 | 12 + .../output/runtime/1591611 | 26 + .../output/runtime/1603734 | 10 + .../output/runtime/1614348 | 42 + .../output/runtime/1623020 | 58 + .../output/runtime/1641861 | 39 + .../output/runtime/1648 | 61 + .../output/runtime/1654137 | 10 + .../output/runtime/1659901 | 12 + .../output/runtime/1661815 | 29 + .../output/runtime/1667401 | 70 + .../output/runtime/1671 | 1360 ++++++++++++++++++++ .../output/runtime/1697 | 22 + .../output/runtime/1704638 | 68 + .../output/runtime/1715162 | 75 ++ .../output/runtime/1724485 | 21 + .../output/runtime/1735384 | 23 + .../output/runtime/1736 | 70 + .../output/runtime/1737444 | 96 ++ .../output/runtime/1740219 | 62 + .../output/runtime/1741 | 4 + .../output/runtime/1748612 | 18 + .../output/runtime/1755 | 23 + .../output/runtime/1756519 | 49 + .../output/runtime/1756807 | 70 + .../output/runtime/1761535 | 39 + .../output/runtime/1763 | 15 + .../output/runtime/1763536 | 86 ++ .../output/runtime/1765970 | 64 + .../output/runtime/1768 | 35 + .../output/runtime/1768246 | 16 + .../output/runtime/1773743 | 24 + .../output/runtime/1774149 | 79 ++ .../output/runtime/1793539 | 12 + .../output/runtime/1798 | 4 + .../output/runtime/1799200 | 43 + .../output/runtime/1805 | 69 + .../output/runtime/1808565 | 10 + .../output/runtime/1809546 | 46 + .../output/runtime/1812 | 28 + .../output/runtime/1813398 | 44 + .../output/runtime/1814128 | 158 +++ .../output/runtime/1818483 | 45 + .../output/runtime/1819 | 13 + .../output/runtime/1832353 | 23 + .../output/runtime/1832916 | 8 + .../output/runtime/1833668 | 30 + .../output/runtime/1834496 | 30 + .../output/runtime/1835693 | 20 + .../output/runtime/1835839 | 24 + .../output/runtime/1836078 | 25 + .../output/runtime/1836192 | 24 + .../output/runtime/1836558 | 51 + .../output/runtime/1840922 | 24 + .../output/runtime/1854 | 21 + .../output/runtime/1857 | 55 + .../output/runtime/1860610 | 10 + .../output/runtime/1861605 | 19 + .../output/runtime/1862167 | 6 + 
.../output/runtime/1862986 | 67 + .../output/runtime/1863445 | 19 + .../output/runtime/1869073 | 10 + .../output/runtime/1878501 | 34 + .../output/runtime/1880225 | 140 ++ .../output/runtime/1880332 | 10 + .../output/runtime/1880722 | 17 + .../output/runtime/1881450 | 26 + .../output/runtime/1883268 | 40 + .../output/runtime/1888303 | 23 + .../output/runtime/1888728 | 22 + .../output/runtime/1889411 | 66 + .../output/runtime/1890 | 28 + .../output/runtime/1894029 | 42 + .../output/runtime/1895080 | 39 + .../output/runtime/1895305 | 51 + .../output/runtime/1895703 | 21 + .../output/runtime/1904259 | 32 + .../output/runtime/1906536 | 33 + .../output/runtime/1907817 | 46 + .../output/runtime/1908551 | 57 + .../output/runtime/1909921 | 25 + .../output/runtime/1913 | 22 + .../output/runtime/1913913 | 21 + .../output/runtime/1914870 | 60 + .../output/runtime/1915531 | 57 + .../output/runtime/1916344 | 27 + .../output/runtime/1917184 | 8 + .../output/runtime/1926202 | 21 + .../output/runtime/1930 | 49 + .../output/runtime/1936977 | 10 + .../output/runtime/1952 | 99 ++ .../output/runtime/1953 | 149 +++ .../output/runtime/2027 | 236 ++++ .../output/runtime/2035 | 57 + .../output/runtime/2072564 | 48 + .../output/runtime/2082 | 47 + .../output/runtime/2101 | 20 + .../output/runtime/2119 | 4 + .../output/runtime/2127 | 4 + .../output/runtime/2156 | 18 + .../output/runtime/2157 | 46 + .../output/runtime/2208 | 91 ++ .../output/runtime/2223 | 38 + .../output/runtime/2304 | 41 + .../output/runtime/2309 | 34 + .../output/runtime/2460 | 11 + .../output/runtime/2485 | 50 + .../output/runtime/2486 | 15 + .../output/runtime/2505 | 4 + .../output/runtime/2525 | 4 + .../output/runtime/2569 | 8 + .../output/runtime/2580 | 15 + .../output/runtime/2590 | 26 + .../output/runtime/2596 | 4 + .../output/runtime/2598 | 4 + .../output/runtime/2604 | 47 + .../no-thinking-deepseek-r1:70b/output/runtime/261 | 4 + .../output/runtime/2619 | 4 + .../output/runtime/2628 | 23 + .../output/runtime/2655 
| 42 + .../output/runtime/2683 | 42 + .../output/runtime/2761 | 11 + .../output/runtime/2775 | 137 ++ .../no-thinking-deepseek-r1:70b/output/runtime/280 | 4 + .../output/runtime/2815 | 4 + .../output/runtime/2846 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/311 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/324 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/355 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/385 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/419 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/442 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/447 | 4 + .../output/runtime/562107 | 15 + .../output/runtime/645662 | 43 + .../no-thinking-deepseek-r1:70b/output/runtime/693 | 13 + .../no-thinking-deepseek-r1:70b/output/runtime/695 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/697 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/698 | 361 ++++++ .../output/runtime/754635 | 58 + .../output/runtime/796480 | 48 + .../no-thinking-deepseek-r1:70b/output/runtime/805 | 17 + .../no-thinking-deepseek-r1:70b/output/runtime/866 | 56 + .../output/runtime/886621 | 295 +++++ .../no-thinking-deepseek-r1:70b/output/runtime/909 | 14 + .../no-thinking-deepseek-r1:70b/output/runtime/922 | 23 + .../no-thinking-deepseek-r1:70b/output/runtime/939 | 78 ++ .../no-thinking-deepseek-r1:70b/output/runtime/95 | 4 + .../no-thinking-deepseek-r1:70b/output/runtime/967 | 227 ++++ .../no-thinking-deepseek-r1:70b/output/runtime/979 | 10 + .../output/syscall/1007 | 4 + .../output/syscall/1010 | 81 ++ .../output/syscall/1012 | 44 + .../output/syscall/1031920 | 40 + .../output/syscall/1033 | 30 + .../output/syscall/1054831 | 20 + .../output/syscall/1066909 | 10 + .../output/syscall/1072 | 27 + .../output/syscall/1075272 | 16 + .../output/syscall/1075339 | 6 + .../output/syscall/1076445 | 48 + .../output/syscall/1111 | 21 + .../output/syscall/1238 | 122 ++ .../output/syscall/1254672 | 44 + .../output/syscall/1261 | 28 + 
.../output/syscall/1263747 | 32 + .../no-thinking-deepseek-r1:70b/output/syscall/127 | 4 + .../output/syscall/1346769 | 39 + .../output/syscall/1356916 | 9 + .../output/syscall/1361 | 23 + .../output/syscall/1394 | 64 + .../output/syscall/1397 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/140 | 4 + .../output/syscall/1416988 | 35 + .../output/syscall/1452 | 4 + .../output/syscall/1457275 | 108 ++ .../output/syscall/1462640 | 38 + .../output/syscall/1470170 | 43 + .../output/syscall/1516408 | 34 + .../output/syscall/1563612 | 53 + .../output/syscall/1585840 | 12 + .../output/syscall/1594394 | 44 + .../output/syscall/1605443 | 14 + .../output/syscall/1619896 | 53 + .../output/syscall/1643619 | 35 + .../output/syscall/1650 | 17 + .../output/syscall/1673976 | 14 + .../output/syscall/1689367 | 29 + .../output/syscall/1696353 | 38 + .../output/syscall/1696773 | 10 + .../output/syscall/1701808 | 19 + .../output/syscall/1701971 | 48 + .../output/syscall/1701973 | 20 + .../output/syscall/1701974 | 20 + .../output/syscall/1707 | 26 + .../output/syscall/1716292 | 33 + .../output/syscall/1716767 | 37 + .../output/syscall/1726394 | 8 + .../output/syscall/1728116 | 50 + .../output/syscall/1729 | 50 + .../output/syscall/1734 | 19 + .../output/syscall/1734792 | 10 + .../output/syscall/1749393 | 29 + .../output/syscall/1756 | 46 + .../output/syscall/1760 | 56 + .../output/syscall/1761153 | 26 + .../output/syscall/1770 | 25 + .../output/syscall/1776478 | 49 + .../output/syscall/1777226 | 18 + .../output/syscall/1783362 | 50 + .../output/syscall/1785203 | 46 + .../output/syscall/1791763 | 16 + .../output/syscall/1791796 | 126 ++ .../output/syscall/1807 | 27 + .../output/syscall/1808563 | 20 + .../output/syscall/1810433 | 50 + .../output/syscall/1813307 | 24 + .../output/syscall/1821006 | 38 + .../output/syscall/1829459 | 38 + .../output/syscall/1837 | 38 + .../output/syscall/1857811 | 10 + .../output/syscall/1860053 | 23 + .../output/syscall/1861341 | 33 + 
.../output/syscall/1869241 | 22 + .../output/syscall/1870477 | 36 + .../output/syscall/1876373 | 51 + .../output/syscall/1884719 | 135 ++ .../output/syscall/1886097 | 36 + .../output/syscall/1887306 | 58 + .../output/syscall/1893010 | 8 + .../output/syscall/1894361 | 8 + .../output/syscall/1910605 | 19 + .../output/syscall/1915925 | 20 + .../output/syscall/1926044 | 33 + .../output/syscall/1926246 | 53 + .../output/syscall/1926521 | 65 + .../output/syscall/1926996 | 23 + .../output/syscall/2112 | 29 + .../output/syscall/2123 | 34 + .../output/syscall/2168 | 35 + .../output/syscall/2170 | 47 + .../output/syscall/2197 | 61 + .../output/syscall/2262 | 202 +++ .../output/syscall/2333 | 48 + .../output/syscall/2353 | 59 + .../output/syscall/2390 | 66 + .../output/syscall/2410 | 95 ++ .../output/syscall/2446 | 63 + .../output/syscall/2504 | 10 + .../output/syscall/2592 | 40 + .../output/syscall/2606 | 201 +++ .../no-thinking-deepseek-r1:70b/output/syscall/263 | 4 + .../output/syscall/2738 | 13 + .../no-thinking-deepseek-r1:70b/output/syscall/275 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/276 | 4 + .../output/syscall/2825 | 40 + .../no-thinking-deepseek-r1:70b/output/syscall/326 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/356 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/456 | 32 + .../no-thinking-deepseek-r1:70b/output/syscall/470 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/570 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/577 | 28 + .../no-thinking-deepseek-r1:70b/output/syscall/578 | 33 + .../no-thinking-deepseek-r1:70b/output/syscall/579 | 53 + .../no-thinking-deepseek-r1:70b/output/syscall/602 | 16 + .../no-thinking-deepseek-r1:70b/output/syscall/633 | 35 + .../no-thinking-deepseek-r1:70b/output/syscall/654 | 26 + .../no-thinking-deepseek-r1:70b/output/syscall/690 | 22 + .../no-thinking-deepseek-r1:70b/output/syscall/704 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/714 | 46 + 
.../no-thinking-deepseek-r1:70b/output/syscall/817 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/833 | 45 + .../no-thinking-deepseek-r1:70b/output/syscall/834 | 62 + .../no-thinking-deepseek-r1:70b/output/syscall/836 | 88 ++ .../no-thinking-deepseek-r1:70b/output/syscall/856 | 64 + .../no-thinking-deepseek-r1:70b/output/syscall/871 | 17 + .../no-thinking-deepseek-r1:70b/output/syscall/885 | 4 + .../no-thinking-deepseek-r1:70b/output/syscall/911 | 20 + .../no-thinking-deepseek-r1:70b/output/syscall/927 | 35 + .../no-thinking-deepseek-r1:70b/output/syscall/957 | 74 ++ .../no-thinking-deepseek-r1:70b/output/syscall/982 | 40 + .../reasoning/instruction/1028 | 3 + .../reasoning/instruction/1051 | 11 + .../reasoning/instruction/1079080 | 3 + .../reasoning/instruction/1086 | 5 + .../reasoning/instruction/1092 | 1 + .../reasoning/instruction/1095531 | 3 + .../reasoning/instruction/1095857 | 3 + .../reasoning/instruction/1128 | 5 + .../reasoning/instruction/1129571 | 3 + .../reasoning/instruction/1156 | 1 + .../reasoning/instruction/1156313 | 3 + .../reasoning/instruction/1178 | 11 + .../reasoning/instruction/122 | 1 + .../reasoning/instruction/1221966 | 7 + .../reasoning/instruction/1233225 | 5 + .../reasoning/instruction/1245543 | 3 + .../reasoning/instruction/1246990 | 3 + .../reasoning/instruction/1248 | 3 + .../reasoning/instruction/1251 | 3 + .../reasoning/instruction/1254786 | 3 + .../reasoning/instruction/1267 | 3 + .../reasoning/instruction/1267955 | 3 + .../reasoning/instruction/1283519 | 3 + .../reasoning/instruction/1308381 | 3 + .../reasoning/instruction/1328996 | 3 + .../reasoning/instruction/1339 | 7 + .../reasoning/instruction/1361912 | 3 + .../reasoning/instruction/1368 | 3 + .../reasoning/instruction/1370 | 1 + .../reasoning/instruction/1371 | 3 + .../reasoning/instruction/1372 | 3 + .../reasoning/instruction/1373 | 3 + .../reasoning/instruction/1374 | 1 + .../reasoning/instruction/1375 | 1 + .../reasoning/instruction/1376 | 3 + 
.../reasoning/instruction/1377 | 3 + .../reasoning/instruction/1404690 | 21 + .../reasoning/instruction/1412 | 3 + .../reasoning/instruction/1428352 | 5 + .../reasoning/instruction/1441 | 3 + .../reasoning/instruction/1469342 | 1 + .../reasoning/instruction/1471 | 27 + .../reasoning/instruction/1494 | 3 + .../reasoning/instruction/1536 | 3 + .../reasoning/instruction/1541 | 5 + .../reasoning/instruction/1553 | 3 + .../reasoning/instruction/1574346 | 1 + .../reasoning/instruction/1590336 | 3 + .../reasoning/instruction/1594069 | 1 + .../reasoning/instruction/1605123 | 3 + .../reasoning/instruction/1606 | 3 + .../reasoning/instruction/1611394 | 3 + .../reasoning/instruction/1612 | 3 + .../reasoning/instruction/1613817 | 3 + .../reasoning/instruction/1620 | 3 + .../reasoning/instruction/1637 | 3 + .../reasoning/instruction/1641637 | 5 + .../reasoning/instruction/1642 | 4 + .../reasoning/instruction/1701821 | 3 + .../reasoning/instruction/1713066 | 1 + .../reasoning/instruction/1722 | 5 + .../reasoning/instruction/1725267 | 7 + .../reasoning/instruction/1727737 | 17 + .../reasoning/instruction/1737 | 3 + .../reasoning/instruction/1738434 | 3 + .../reasoning/instruction/1748296 | 3 + .../reasoning/instruction/1751422 | 1 + .../reasoning/instruction/1751494 | 16 + .../reasoning/instruction/1756927 | 5 + .../reasoning/instruction/1761401 | 3 + .../reasoning/instruction/1771 | 5 + .../reasoning/instruction/1779 | 3 + .../reasoning/instruction/1779634 | 7 + .../reasoning/instruction/1780 | 1 + .../reasoning/instruction/1781281 | 3 + .../reasoning/instruction/1785734 | 3 + .../reasoning/instruction/1790 | 3 + .../reasoning/instruction/1793119 | 3 + .../reasoning/instruction/1793608 | 1 + .../reasoning/instruction/1796520 | 3 + .../reasoning/instruction/1806243 | 3 + .../reasoning/instruction/1812451 | 3 + .../reasoning/instruction/1812861 | 3 + .../reasoning/instruction/1815024 | 1 + .../reasoning/instruction/1818075 | 3 + .../reasoning/instruction/1820686 | 1 + 
.../reasoning/instruction/1821430 | 3 + .../reasoning/instruction/1821444 | 7 + .../reasoning/instruction/1821515 | 3 + .../reasoning/instruction/1824778 | 3 + .../reasoning/instruction/1826568 | 3 + .../reasoning/instruction/1828867 | 3 + .../reasoning/instruction/1832422 | 25 + .../reasoning/instruction/1841990 | 7 + .../reasoning/instruction/1847467 | 3 + .../reasoning/instruction/1858415 | 3 + .../reasoning/instruction/1859713 | 7 + .../reasoning/instruction/1860056 | 7 + .../reasoning/instruction/1861404 | 3 + .../reasoning/instruction/1863247 | 3 + .../reasoning/instruction/1873898 | 3 + .../reasoning/instruction/1874888 | 15 + .../reasoning/instruction/1877794 | 7 + .../reasoning/instruction/1883784 | 3 + .../reasoning/instruction/1885350 | 5 + .../reasoning/instruction/1889288 | 10 + .../reasoning/instruction/1892081 | 1 + .../reasoning/instruction/1895471 | 5 + .../reasoning/instruction/1901 | 3 + .../reasoning/instruction/1904210 | 12 + .../reasoning/instruction/1905356 | 3 + .../reasoning/instruction/1907969 | 3 + .../reasoning/instruction/1908 | 10 + .../reasoning/instruction/1909 | 3 + .../reasoning/instruction/1912934 | 5 + .../reasoning/instruction/1914021 | 7 + .../reasoning/instruction/1916269 | 3 + .../reasoning/instruction/1918026 | 3 + .../reasoning/instruction/1922887 | 3 + .../reasoning/instruction/1925512 | 3 + .../reasoning/instruction/1926759 | 3 + .../reasoning/instruction/1927530 | 3 + .../reasoning/instruction/1941 | 3 + .../reasoning/instruction/1955 | 3 + .../reasoning/instruction/2078 | 10 + .../reasoning/instruction/2083 | 3 + .../reasoning/instruction/2089 | 3 + .../reasoning/instruction/2122 | 18 + .../reasoning/instruction/2136 | 3 + .../reasoning/instruction/2175 | 3 + .../reasoning/instruction/2203 | 1 + .../reasoning/instruction/2248 | 3 + .../reasoning/instruction/2302 | 1 + .../reasoning/instruction/2317 | 3 + .../reasoning/instruction/2318 | 3 + .../reasoning/instruction/2319 | 3 + .../reasoning/instruction/2336 | 3 + 
.../reasoning/instruction/2371 | 3 + .../reasoning/instruction/2372 | 3 + .../reasoning/instruction/2373 | 3 + .../reasoning/instruction/2375 | 3 + .../reasoning/instruction/2376 | 3 + .../reasoning/instruction/2386 | 3 + .../reasoning/instruction/2419 | 3 + .../reasoning/instruction/2422 | 3 + .../reasoning/instruction/2474 | 3 + .../reasoning/instruction/2483 | 3 + .../reasoning/instruction/2487 | 3 + .../reasoning/instruction/2497 | 3 + .../reasoning/instruction/2498 | 3 + .../reasoning/instruction/2499 | 3 + .../reasoning/instruction/2500 | 3 + .../reasoning/instruction/2536 | 1 + .../reasoning/instruction/2595 | 3 + .../reasoning/instruction/2632 | 3 + .../reasoning/instruction/2647 | 3 + .../reasoning/instruction/266 | 1 + .../reasoning/instruction/2672 | 13 + .../reasoning/instruction/2696 | 3 + .../reasoning/instruction/2730 | 3 + .../reasoning/instruction/2802 | 3 + .../reasoning/instruction/2865 | 3 + .../reasoning/instruction/2878 | 3 + .../reasoning/instruction/2971 | 3 + .../reasoning/instruction/312 | 1 + .../reasoning/instruction/333 | 3 + .../reasoning/instruction/361 | 1 + .../reasoning/instruction/364 | 3 + .../reasoning/instruction/381 | 3 + .../reasoning/instruction/390 | 1 + .../reasoning/instruction/422 | 16 + .../reasoning/instruction/427 | 3 + .../reasoning/instruction/449 | 3 + .../reasoning/instruction/494 | 3 + .../reasoning/instruction/508 | 1 + .../reasoning/instruction/514 | 3 + .../reasoning/instruction/616 | 3 + .../reasoning/instruction/618 | 8 + .../reasoning/instruction/625 | 3 + .../reasoning/instruction/754 | 3 + .../reasoning/instruction/799 | 3 + .../reasoning/instruction/824 | 3 + .../reasoning/instruction/826 | 3 + .../reasoning/instruction/837 | 5 + .../reasoning/instruction/890 | 1 + .../reasoning/instruction/904308 | 3 + .../reasoning/instruction/947 | 3 + .../reasoning/instruction/952 | 3 + .../reasoning/instruction/984 | 3 + .../reasoning/instruction/993 | 3 + .../reasoning/instruction/998 | 3 + 
.../reasoning/manual-review/1022 | 9 + .../reasoning/manual-review/1550503 | 9 + .../reasoning/manual-review/1593 | 7 + .../reasoning/manual-review/1617929 | 5 + .../reasoning/manual-review/1738545 | 13 + .../reasoning/manual-review/1805913 | 3 + .../reasoning/manual-review/1824344 | 18 + .../reasoning/manual-review/1830 | 14 + .../reasoning/manual-review/1833 | 21 + .../reasoning/manual-review/1854738 | 11 + .../reasoning/manual-review/1858461 | 7 + .../reasoning/manual-review/1869782 | 11 + .../reasoning/manual-review/1895 | 7 + .../reasoning/manual-review/1898954 | 5 + .../reasoning/manual-review/1906193 | 13 + .../reasoning/manual-review/1908626 | 7 + .../reasoning/manual-review/1910 | 14 + .../reasoning/manual-review/1915327 | 7 + .../reasoning/manual-review/1967248 | 9 + .../reasoning/manual-review/2374 | 20 + .../reasoning/manual-review/2448 | 5 + .../reasoning/manual-review/2495 | 7 + .../reasoning/manual-review/2553 | 12 + .../reasoning/manual-review/2560 | 5 + .../reasoning/manual-review/306 | 1 + .../reasoning/manual-review/739785 | 11 + .../reasoning/manual-review/829 | 18 + .../reasoning/runtime/1010484 | 9 + .../reasoning/runtime/1027 | 3 + .../reasoning/runtime/1034 | 1 + .../reasoning/runtime/1041 | 11 + .../reasoning/runtime/1044 | 1 + .../reasoning/runtime/1052857 | 5 + .../reasoning/runtime/1054812 | 3 + .../reasoning/runtime/1059 | 23 + .../reasoning/runtime/1068900 | 3 + .../reasoning/runtime/1070 | 3 + .../reasoning/runtime/1075 | 3 + .../reasoning/runtime/1093 | 3 + .../reasoning/runtime/1098729 | 13 + .../reasoning/runtime/1102 | 5 + .../reasoning/runtime/1143 | 3 + .../reasoning/runtime/1147 | 3 + .../reasoning/runtime/1165383 | 3 + .../reasoning/runtime/1172613 | 3 + .../reasoning/runtime/1182490 | 3 + .../reasoning/runtime/1187319 | 3 + .../reasoning/runtime/1207896 | 9 + .../reasoning/runtime/1209 | 1 + .../reasoning/runtime/121 | 3 + .../reasoning/runtime/1211 | 1 + .../reasoning/runtime/1228 | 3 + .../reasoning/runtime/1245703 | 3 + 
.../reasoning/runtime/1248168 | 3 + .../reasoning/runtime/1254828 | 3 + .../reasoning/runtime/1255 | 5 + .../reasoning/runtime/1261743 | 3 + .../reasoning/runtime/1285363 | 3 + .../reasoning/runtime/1287195 | 11 + .../reasoning/runtime/1294898 | 3 + .../reasoning/runtime/1311614 | 3 + .../reasoning/runtime/1319100 | 9 + .../reasoning/runtime/1346784 | 3 + .../reasoning/runtime/1357206 | 3 + .../reasoning/runtime/1357226 | 3 + .../reasoning/runtime/1362635 | 5 + .../reasoning/runtime/1388 | 3 + .../reasoning/runtime/1429313 | 3 + .../reasoning/runtime/1435 | 3 + .../reasoning/runtime/1478 | 3 + .../reasoning/runtime/1495 | 3 + .../reasoning/runtime/1512 | 3 + .../reasoning/runtime/1519037 | 3 + .../reasoning/runtime/1527765 | 3 + .../reasoning/runtime/1528 | 3 + .../reasoning/runtime/1528239 | 3 + .../reasoning/runtime/1531 | 3 + .../reasoning/runtime/1533141 | 3 + .../reasoning/runtime/1547 | 3 + .../reasoning/runtime/1568107 | 3 + .../reasoning/runtime/1591611 | 7 + .../reasoning/runtime/1603734 | 3 + .../reasoning/runtime/1614348 | 1 + .../reasoning/runtime/1623020 | 5 + .../reasoning/runtime/1641861 | 3 + .../reasoning/runtime/1648 | 4 + .../reasoning/runtime/1654137 | 5 + .../reasoning/runtime/1659901 | 3 + .../reasoning/runtime/1661815 | 3 + .../reasoning/runtime/1667401 | 3 + .../reasoning/runtime/1671 | 3 + .../reasoning/runtime/1697 | 3 + .../reasoning/runtime/1704638 | 3 + .../reasoning/runtime/1715162 | 3 + .../reasoning/runtime/1724485 | 3 + .../reasoning/runtime/1735384 | 15 + .../reasoning/runtime/1736 | 3 + .../reasoning/runtime/1737444 | 15 + .../reasoning/runtime/1740219 | 3 + .../reasoning/runtime/1741 | 3 + .../reasoning/runtime/1748612 | 3 + .../reasoning/runtime/1755 | 3 + .../reasoning/runtime/1756519 | 3 + .../reasoning/runtime/1756807 | 3 + .../reasoning/runtime/1761535 | 5 + .../reasoning/runtime/1763 | 3 + .../reasoning/runtime/1763536 | 3 + .../reasoning/runtime/1765970 | 5 + .../reasoning/runtime/1768 | 3 + .../reasoning/runtime/1768246 | 
3 + .../reasoning/runtime/1773743 | 3 + .../reasoning/runtime/1774149 | 3 + .../reasoning/runtime/1793539 | 3 + .../reasoning/runtime/1798 | 7 + .../reasoning/runtime/1799200 | 3 + .../reasoning/runtime/1805 | 5 + .../reasoning/runtime/1808565 | 5 + .../reasoning/runtime/1809546 | 3 + .../reasoning/runtime/1812 | 3 + .../reasoning/runtime/1813398 | 9 + .../reasoning/runtime/1814128 | 3 + .../reasoning/runtime/1818483 | 5 + .../reasoning/runtime/1819 | 3 + .../reasoning/runtime/1832353 | 3 + .../reasoning/runtime/1832916 | 1 + .../reasoning/runtime/1833668 | 5 + .../reasoning/runtime/1834496 | 3 + .../reasoning/runtime/1835693 | 3 + .../reasoning/runtime/1835839 | 3 + .../reasoning/runtime/1836078 | 3 + .../reasoning/runtime/1836192 | 3 + .../reasoning/runtime/1836558 | 10 + .../reasoning/runtime/1840922 | 3 + .../reasoning/runtime/1854 | 3 + .../reasoning/runtime/1857 | 3 + .../reasoning/runtime/1860610 | 3 + .../reasoning/runtime/1861605 | 3 + .../reasoning/runtime/1862167 | 7 + .../reasoning/runtime/1862986 | 3 + .../reasoning/runtime/1863445 | 3 + .../reasoning/runtime/1869073 | 3 + .../reasoning/runtime/1878501 | 3 + .../reasoning/runtime/1880225 | 13 + .../reasoning/runtime/1880332 | 3 + .../reasoning/runtime/1880722 | 11 + .../reasoning/runtime/1881450 | 7 + .../reasoning/runtime/1883268 | 3 + .../reasoning/runtime/1888303 | 3 + .../reasoning/runtime/1888728 | 3 + .../reasoning/runtime/1889411 | 3 + .../reasoning/runtime/1890 | 3 + .../reasoning/runtime/1894029 | 5 + .../reasoning/runtime/1895080 | 3 + .../reasoning/runtime/1895305 | 3 + .../reasoning/runtime/1895703 | 3 + .../reasoning/runtime/1904259 | 3 + .../reasoning/runtime/1906536 | 3 + .../reasoning/runtime/1907817 | 3 + .../reasoning/runtime/1908551 | 7 + .../reasoning/runtime/1909921 | 3 + .../reasoning/runtime/1913 | 10 + .../reasoning/runtime/1913913 | 3 + .../reasoning/runtime/1914870 | 5 + .../reasoning/runtime/1915531 | 5 + .../reasoning/runtime/1916344 | 1 + .../reasoning/runtime/1917184 | 5 + 
.../reasoning/runtime/1926202 | 3 + .../reasoning/runtime/1930 | 20 + .../reasoning/runtime/1936977 | 3 + .../reasoning/runtime/1952 | 3 + .../reasoning/runtime/1953 | 5 + .../reasoning/runtime/2027 | 5 + .../reasoning/runtime/2035 | 3 + .../reasoning/runtime/2072564 | 3 + .../reasoning/runtime/2082 | 3 + .../reasoning/runtime/2101 | 30 + .../reasoning/runtime/2119 | 3 + .../reasoning/runtime/2127 | 3 + .../reasoning/runtime/2156 | 3 + .../reasoning/runtime/2157 | 3 + .../reasoning/runtime/2208 | 3 + .../reasoning/runtime/2223 | 3 + .../reasoning/runtime/2304 | 5 + .../reasoning/runtime/2309 | 3 + .../reasoning/runtime/2460 | 3 + .../reasoning/runtime/2485 | 3 + .../reasoning/runtime/2486 | 3 + .../reasoning/runtime/2505 | 3 + .../reasoning/runtime/2525 | 16 + .../reasoning/runtime/2569 | 3 + .../reasoning/runtime/2580 | 3 + .../reasoning/runtime/2590 | 5 + .../reasoning/runtime/2596 | 3 + .../reasoning/runtime/2598 | 3 + .../reasoning/runtime/2604 | 3 + .../reasoning/runtime/261 | 18 + .../reasoning/runtime/2619 | 3 + .../reasoning/runtime/2628 | 5 + .../reasoning/runtime/2655 | 3 + .../reasoning/runtime/2683 | 5 + .../reasoning/runtime/2761 | 3 + .../reasoning/runtime/2775 | 3 + .../reasoning/runtime/280 | 7 + .../reasoning/runtime/2815 | 5 + .../reasoning/runtime/2846 | 3 + .../reasoning/runtime/311 | 1 + .../reasoning/runtime/324 | 3 + .../reasoning/runtime/355 | 3 + .../reasoning/runtime/385 | 3 + .../reasoning/runtime/419 | 3 + .../reasoning/runtime/442 | 11 + .../reasoning/runtime/447 | 1 + .../reasoning/runtime/562107 | 12 + .../reasoning/runtime/645662 | 3 + .../reasoning/runtime/693 | 1 + .../reasoning/runtime/695 | 8 + .../reasoning/runtime/697 | 1 + .../reasoning/runtime/698 | 3 + .../reasoning/runtime/754635 | 3 + .../reasoning/runtime/796480 | 5 + .../reasoning/runtime/805 | 7 + .../reasoning/runtime/866 | 3 + .../reasoning/runtime/886621 | 3 + .../reasoning/runtime/909 | 3 + .../reasoning/runtime/922 | 3 + .../reasoning/runtime/939 | 3 + 
.../reasoning/runtime/95 | 16 + .../reasoning/runtime/967 | 1 + .../reasoning/runtime/979 | 3 + .../reasoning/syscall/1007 | 1 + .../reasoning/syscall/1010 | 3 + .../reasoning/syscall/1012 | 1 + .../reasoning/syscall/1031920 | 3 + .../reasoning/syscall/1033 | 6 + .../reasoning/syscall/1054831 | 7 + .../reasoning/syscall/1066909 | 3 + .../reasoning/syscall/1072 | 3 + .../reasoning/syscall/1075272 | 1 + .../reasoning/syscall/1075339 | 1 + .../reasoning/syscall/1076445 | 5 + .../reasoning/syscall/1111 | 1 + .../reasoning/syscall/1238 | 7 + .../reasoning/syscall/1254672 | 3 + .../reasoning/syscall/1261 | 1 + .../reasoning/syscall/1263747 | 1 + .../reasoning/syscall/127 | 13 + .../reasoning/syscall/1346769 | 3 + .../reasoning/syscall/1356916 | 3 + .../reasoning/syscall/1361 | 1 + .../reasoning/syscall/1394 | 3 + .../reasoning/syscall/1397 | 3 + .../reasoning/syscall/140 | 3 + .../reasoning/syscall/1416988 | 1 + .../reasoning/syscall/1452 | 1 + .../reasoning/syscall/1457275 | 5 + .../reasoning/syscall/1462640 | 3 + .../reasoning/syscall/1470170 | 1 + .../reasoning/syscall/1516408 | 1 + .../reasoning/syscall/1563612 | 1 + .../reasoning/syscall/1585840 | 11 + .../reasoning/syscall/1594394 | 5 + .../reasoning/syscall/1605443 | 1 + .../reasoning/syscall/1619896 | 3 + .../reasoning/syscall/1643619 | 7 + .../reasoning/syscall/1650 | 1 + .../reasoning/syscall/1673976 | 3 + .../reasoning/syscall/1689367 | 1 + .../reasoning/syscall/1696353 | 3 + .../reasoning/syscall/1696773 | 3 + .../reasoning/syscall/1701808 | 1 + .../reasoning/syscall/1701971 | 3 + .../reasoning/syscall/1701973 | 1 + .../reasoning/syscall/1701974 | 1 + .../reasoning/syscall/1707 | 3 + .../reasoning/syscall/1716292 | 3 + .../reasoning/syscall/1716767 | 3 + .../reasoning/syscall/1726394 | 1 + .../reasoning/syscall/1728116 | 3 + .../reasoning/syscall/1729 | 3 + .../reasoning/syscall/1734 | 3 + .../reasoning/syscall/1734792 | 1 + .../reasoning/syscall/1749393 | 1 + .../reasoning/syscall/1756 | 1 + 
.../reasoning/syscall/1760 | 1 + .../reasoning/syscall/1761153 | 3 + .../reasoning/syscall/1770 | 3 + .../reasoning/syscall/1776478 | 3 + .../reasoning/syscall/1777226 | 1 + .../reasoning/syscall/1783362 | 3 + .../reasoning/syscall/1785203 | 3 + .../reasoning/syscall/1791763 | 3 + .../reasoning/syscall/1791796 | 3 + .../reasoning/syscall/1807 | 3 + .../reasoning/syscall/1808563 | 3 + .../reasoning/syscall/1810433 | 1 + .../reasoning/syscall/1813307 | 7 + .../reasoning/syscall/1821006 | 1 + .../reasoning/syscall/1829459 | 3 + .../reasoning/syscall/1837 | 3 + .../reasoning/syscall/1857811 | 1 + .../reasoning/syscall/1860053 | 3 + .../reasoning/syscall/1861341 | 3 + .../reasoning/syscall/1869241 | 7 + .../reasoning/syscall/1870477 | 3 + .../reasoning/syscall/1876373 | 5 + .../reasoning/syscall/1884719 | 3 + .../reasoning/syscall/1886097 | 5 + .../reasoning/syscall/1887306 | 3 + .../reasoning/syscall/1893010 | 1 + .../reasoning/syscall/1894361 | 1 + .../reasoning/syscall/1910605 | 31 + .../reasoning/syscall/1915925 | 3 + .../reasoning/syscall/1926044 | 3 + .../reasoning/syscall/1926246 | 3 + .../reasoning/syscall/1926521 | 3 + .../reasoning/syscall/1926996 | 1 + .../reasoning/syscall/2112 | 1 + .../reasoning/syscall/2123 | 1 + .../reasoning/syscall/2168 | 11 + .../reasoning/syscall/2170 | 3 + .../reasoning/syscall/2197 | 3 + .../reasoning/syscall/2262 | 3 + .../reasoning/syscall/2333 | 10 + .../reasoning/syscall/2353 | 5 + .../reasoning/syscall/2390 | 3 + .../reasoning/syscall/2410 | 1 + .../reasoning/syscall/2446 | 1 + .../reasoning/syscall/2504 | 3 + .../reasoning/syscall/2592 | 3 + .../reasoning/syscall/2606 | 3 + .../reasoning/syscall/263 | 3 + .../reasoning/syscall/2738 | 3 + .../reasoning/syscall/275 | 3 + .../reasoning/syscall/276 | 3 + .../reasoning/syscall/2825 | 3 + .../reasoning/syscall/326 | 1 + .../reasoning/syscall/356 | 1 + .../reasoning/syscall/456 | 3 + .../reasoning/syscall/470 | 1 + .../reasoning/syscall/570 | 1 + .../reasoning/syscall/577 | 3 + 
.../reasoning/syscall/578 | 13 + .../reasoning/syscall/579 | 3 + .../reasoning/syscall/602 | 3 + .../reasoning/syscall/633 | 1 + .../reasoning/syscall/654 | 3 + .../reasoning/syscall/690 | 7 + .../reasoning/syscall/704 | 3 + .../reasoning/syscall/714 | 3 + .../reasoning/syscall/817 | 3 + .../reasoning/syscall/833 | 3 + .../reasoning/syscall/834 | 3 + .../reasoning/syscall/836 | 1 + .../reasoning/syscall/856 | 3 + .../reasoning/syscall/871 | 1 + .../reasoning/syscall/885 | 3 + .../reasoning/syscall/911 | 3 + .../reasoning/syscall/927 | 5 + .../reasoning/syscall/957 | 5 + .../reasoning/syscall/982 | 3 + 1103 files changed, 25897 insertions(+) create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/categories.csv create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1028 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1051 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1079080 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1086 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1092 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1128 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1129571 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156313 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1178 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/122 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1221966 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1233225 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1245543 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1246990 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1251 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1254786 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1267 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1267955 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1283519 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1308381 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1328996 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1339 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1361912 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1368 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1370 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1371 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1372 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1374 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1375 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1376 create 
mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1377 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1404690 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1412 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1428352 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1441 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1469342 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1471 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1541 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1553 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1574346 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1590336 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1594069 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1605123 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1606 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1611394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1613817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1620 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1637 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1641637 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1642 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1701821 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1713066 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1722 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1725267 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1727737 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1737 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1738434 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1748296 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1751422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1751494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1756927 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1761401 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1771 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1779 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1779634 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1780 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1781281 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1785734 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1790 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1793119 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1793608 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1796520 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1806243 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1812451 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1812861 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1815024 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1818075 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1820686 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1821430 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1821444 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1821515 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1824778 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1826568 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1828867 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1832422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1841990 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1847467 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1858415 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1859713 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1860056 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1861404 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1863247 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1873898 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1874888 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1877794 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1883784 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1885350 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1889288 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1892081 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1895471 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1901 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1904210 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1905356 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1907969 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1908 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1912934 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1914021 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1916269 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1918026 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1922887 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1925512 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1926759 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1927530 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1941 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1955 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2078 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2083 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2089 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2122 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2136 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2175 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2203 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2302 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2317 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2318 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2319 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2336 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2371 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2372 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2375 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2376 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2386 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2419 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2474 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2483 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2487 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2497 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2498 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2499 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2500 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2595 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2632 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2647 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/266 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2672 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2696 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2730 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2802 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2865 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2878 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/2971 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/312 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/333 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/364 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/381 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/390 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/427 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/449 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/508 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/514 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/616 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/618 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/625 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/754 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/799 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/824 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/826 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/837 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/890 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/instruction/904308 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/947 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/952 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/984 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/993 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/instruction/998 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1022 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1550503 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1593 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1617929 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1738545 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1805913 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1824344 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1830 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1833 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1854738 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1858461 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1869782 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1895 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1898954 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1906193 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1908626 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1910 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1915327 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/1967248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/2374 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/2448 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/2495 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/2553 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/2560 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/306 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/739785 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/manual-review/829 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1010484 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1027 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1034 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1041 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1044 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1052857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1054812 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1059 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1068900 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1070 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1075 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1093 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1098729 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1102 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1143 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1147 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1165383 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1172613 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1182490 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1187319 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1207896 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1209 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/121 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1211 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1228 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1245703 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1248168 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1254828 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1255 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1261743 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1285363 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1287195 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1294898 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1311614 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1319100 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1346784 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1357206 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1357226 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1362635 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1388 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1429313 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1435 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1478 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1495 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1512 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1519037 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1527765 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1528 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1528239 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1533141 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1547 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1568107 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1591611 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1603734 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1614348 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1623020 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1641861 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1648 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1654137 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1659901 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1661815 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1667401 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1671 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1697 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1704638 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1715162 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1724485 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1735384 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1736 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1737444 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1740219 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1741 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1748612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1755 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1756519 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1756807 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1761535 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1763 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1763536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1765970 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1768 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1768246 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1773743 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1774149 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1793539 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1798 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1799200 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1805 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1808565 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1809546 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1812 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1813398 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1814128 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1818483 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1819 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1832353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1832916 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1833668 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1834496 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1835693 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1835839 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1836078 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1836192 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1836558 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1840922 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1854 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1860610 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1861605 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1862167 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1862986 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1863445 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1869073 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1878501 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1880225 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1880332 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1880722 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1881450 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1883268 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1888303 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1888728 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1889411 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1890 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1894029 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1895080 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1895305 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1895703 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1904259 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1906536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1907817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1908551 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1909921 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1913 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1913913 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1914870 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1915531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1916344 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1917184 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1926202 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1930 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1936977 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1952 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/1953 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2027 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2035 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2072564 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2082 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2101 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2119 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2127 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2156 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2157 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2208 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2223 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2304 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2309 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2460 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2485 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2486 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2505 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2525 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2569 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2580 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2590 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2596 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2598 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2604 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/261 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2619 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2628 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2655 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2683 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2761 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2775 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/280 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2815 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/2846 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/311 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/324 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/355 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/385 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/419 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/442 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/447 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/562107 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/645662 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/693 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/695 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/runtime/697 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/698 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/754635 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/796480 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/805 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/866 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/886621 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/922 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/939 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/95 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/967 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/runtime/979 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1007 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1010 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1012 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1031920 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1033 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1054831 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1066909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1072 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1075272 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1075339 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1076445 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1111 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1238 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1254672 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1261 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1263747 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/127 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1346769 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1356916 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1397 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/140 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1416988 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1452 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1457275 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1462640 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1470170 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1516408 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1563612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1585840 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1594394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1605443 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1619896 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1643619 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1650 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1673976 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1689367 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1696353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1696773 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1701808 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1701971 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1701973 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1701974 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1707 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1716292 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1716767 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1726394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1728116 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1729 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1734 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1734792 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1749393 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1756 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1760 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1761153 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1770 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1776478 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1777226 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1783362 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1785203 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1791763 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1791796 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1807 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1808563 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1810433 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1813307 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1821006 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1829459 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1837 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1857811 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1860053 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1861341 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1869241 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1870477 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1876373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1884719 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1886097 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1887306 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1893010 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1894361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1910605 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1915925 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1926044 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1926246 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1926521 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/1926996 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2112 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2123 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2168 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2170 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2197 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2262 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2333 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2390 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2410 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2446 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2504 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2592 create 
mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2606 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/263 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2738 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/275 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/276 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/2825 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/326 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/356 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/456 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/470 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/570 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/577 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/578 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/579 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/602 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/633 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/654 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/690 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/704 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/714 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/833 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/834 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/output/syscall/836 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/856 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/871 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/885 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/911 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/927 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/957 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/output/syscall/982 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1028 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1051 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1079080 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1086 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1092 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1095531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1095857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1128 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1129571 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1156 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1156313 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1178 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/122 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1221966 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1233225 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1245543 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1246990 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1251 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1254786 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1267 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1267955 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1283519 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1308381 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1328996 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1339 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1361912 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1368 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1370 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1371 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1372 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1374 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1375 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1376 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1377 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1404690 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1412 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1428352 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1441 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1469342 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1471 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1541 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1553 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1574346 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1590336 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1594069 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1605123 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1606 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1611394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1613817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1620 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1637 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1641637 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1642 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1701821 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1713066 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1722 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1725267 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1727737 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1737 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1738434 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1748296 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1751422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1751494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1756927 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1761401 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1771 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1779 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1779634 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1780 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1781281 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1785734 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1790 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1793119 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1793608 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1796520 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1806243 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1812451 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1812861 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1815024 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1818075 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1820686 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1821430 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1821444 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1821515 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1824778 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1826568 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1828867 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1832422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1841990 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1847467 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1858415 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1859713 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1860056 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1861404 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1863247 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1873898 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1874888 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1877794 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1883784 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1885350 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1889288 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1892081 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1895471 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1901 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1904210 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1905356 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1907969 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1908 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1912934 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1914021 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1916269 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1918026 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1922887 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1925512 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1926759 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1927530 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1941 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/1955 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2078 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2083 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2089 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2122 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2136 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2175 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2203 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2302 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2317 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2318 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2319 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2336 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2371 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2372 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2375 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2376 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2386 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2419 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2474 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2483 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2487 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2497 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2498 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2499 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2500 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2595 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2632 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2647 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/266 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2672 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2696 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2730 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2802 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2865 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2878 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/2971 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/312 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/333 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/364 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/381 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/390 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/422 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/427 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/449 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/494 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/508 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/514 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/616 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/618 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/625 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/754 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/799 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/824 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/826 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/837 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/890 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/904308 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/947 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/952 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/984 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/993 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/instruction/998 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1022 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1550503 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1593 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1617929 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1738545 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1805913 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1824344 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1830 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1833 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1854738 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1858461 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1869782 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1895 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1898954 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1906193 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1908626 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1910 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1915327 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/1967248 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/2374 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/2448 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/2495 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/2553 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/2560 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/306 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/739785 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/manual-review/829 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1010484 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1027 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1034 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1041 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1044 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1052857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1054812 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1059 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1068900 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1070 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1075 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1093 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1098729 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1102 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1143 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1147 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1165383 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1172613 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1182490 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1187319 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1207896 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1209 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/121 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1211 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1228 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1245703 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1248168 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1254828 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1255 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1261743 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1285363 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1287195 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1294898 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1311614 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1319100 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1346784 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1357206 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1357226 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1362635 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1388 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1429313 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1435 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1478 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1495 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1512 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1519037 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1527765 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1528 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1528239 create mode 
100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1533141 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1547 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1568107 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1591611 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1603734 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1614348 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1623020 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1641861 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1648 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1654137 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1659901 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1661815 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1667401 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1671 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1697 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1704638 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1715162 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1724485 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1735384 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1736 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1737444 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1740219 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1741 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1748612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1755 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1756519 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1756807 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1761535 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1763 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1763536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1765970 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1768 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1768246 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1773743 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1774149 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1793539 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1798 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1799200 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1805 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1808565 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1809546 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1812 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1813398 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1814128 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1818483 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1819 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1832353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1832916 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1833668 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1834496 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1835693 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1835839 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1836078 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1836192 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1836558 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1840922 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1854 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1857 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1860610 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1861605 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1862167 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1862986 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1863445 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1869073 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1878501 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1880225 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1880332 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1880722 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1881450 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1883268 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1888303 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1888728 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1889411 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1890 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1894029 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1895080 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1895305 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1895703 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1904259 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1906536 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1907817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1908551 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1909921 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1913 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1913913 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1914870 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1915531 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1916344 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1917184 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1926202 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1930 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1936977 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1952 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/1953 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2027 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2035 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2072564 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2082 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2101 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2119 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2127 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2156 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2157 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2208 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2223 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2304 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2309 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2460 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2485 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2486 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2505 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2525 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2569 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2580 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2590 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2596 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2598 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2604 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/261 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2619 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2628 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2655 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2683 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2761 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2775 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/280 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2815 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/2846 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/311 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/324 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/355 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/385 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/419 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/442 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/447 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/562107 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/645662 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/693 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/695 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/697 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/698 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/754635 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/796480 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/805 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/866 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/886621 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/922 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/939 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/95 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/967 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/runtime/979 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1007 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1010 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1012 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1031920 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1033 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1054831 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1066909 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1072 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1075272 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1075339 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1076445 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1111 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1238 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1254672 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1261 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1263747 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/127 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1346769 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1356916 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1394 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1397 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/140 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1416988 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1452 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1457275 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1462640 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1470170 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1516408 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1563612 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1585840 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1594394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1605443 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1619896 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1643619 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1650 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1673976 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1689367 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1696353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1696773 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1701808 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1701971 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1701973 create 
mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1701974 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1707 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1716292 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1716767 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1726394 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1728116 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1729 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1734 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1734792 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1749393 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1756 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1760 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1761153 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1770 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1776478 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1777226 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1783362 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1785203 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1791763 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1791796 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1807 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1808563 
create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1810433 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1813307 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1821006 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1829459 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1837 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1857811 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1860053 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1861341 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1869241 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1870477 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1876373 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1884719 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1886097 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1887306 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1893010 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1894361 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1910605 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1915925 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1926044 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1926246 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1926521 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/1926996 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2112 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2123 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2168 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2170 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2197 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2262 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2333 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2353 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2390 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2410 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2446 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2504 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2592 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2606 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/263 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2738 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/275 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/276 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/2825 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/326 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/356 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/456 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/470 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/570 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/577 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/578 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/579 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/602 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/633 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/654 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/690 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/704 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/714 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/817 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/833 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/834 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/836 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/856 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/871 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/885 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/911 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/927 create mode 100644 results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/957 create mode 100644 
results/classifier/no-thinking-deepseek-r1:70b/reasoning/syscall/982 diff --git a/results/classifier/no-thinking-deepseek-r1:70b/categories.csv b/results/classifier/no-thinking-deepseek-r1:70b/categories.csv new file mode 100644 index 00000000..489a55f4 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/categories.csv @@ -0,0 +1,5 @@ +category, count +syscall, 131 +runtime, 202 +manual-review, 27 +instruction, 191 diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1028 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1028 new file mode 100644 index 00000000..cda1046c --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1028 @@ -0,0 +1,37 @@ + + + +Assert fail for RISC-V RVV vmv.v.x for e64, vl == vl_max on RV32 guest +Description of problem: +assert message: +qemu/tcg/tcg-op-gvec.c:1714: tcg_gen_gvec_dup_i32: Assertion `vece <= MO_32' failed. + +For a e64 vmv.v.x, in the file trans_rvv.c.inc, function "trans_vmv_v_x", when s->vl_eq_vlmax is true, then "tcg_gen_gvec_dup_tl" (it's defined to tcg_gen_gvec_dup_i32 for RV32) is called. In "tcg_gen_gvec_dup_i32" the assert "tcg_debug_assert(vece <= MO_32) will be triggered, since vece == MO_64 for e64. +Steps to reproduce: +1.enable cfg.Zve64f + +2.Prepare a problem as set e64, vl == vl_max and use vmv.v.x, maybe as below +``` + li t0, -1, + vsetvli x0, t0, e64,m1,tu,mu + li t1, -1 + vmv.v.x v0, t1 +``` +Additional information: +Below is a possible solution if it's appropriate. 
+``` +#if TARGET_LONG_BITS == 32 + if (s->sew == 3) { + TCGv_i64 s1_i64 = tcg_temp_new_i64(); + tcg_gen_ext_tl_i64(s1_i64, s1); + tcg_gen_gvec_dup_i64(s->sew, vreg_ofs(s, a->rd), + MAXSZ(s), MAXSZ(s), s1_i64); + tcg_temp_free_i64(s1_i64); + } else { +#endif + tcg_gen_gvec_dup_tl(s->sew, vreg_ofs(s, a->rd), + MAXSZ(s), MAXSZ(s), s1); +#if TARGET_LONG_BITS == 32 + } +#endif +``` diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1051 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1051 new file mode 100644 index 00000000..fcbf675c --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1051 @@ -0,0 +1,4 @@ + + + +or1k tcg SIGILL diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1079080 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1079080 new file mode 100644 index 00000000..069bd5e2 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1079080 @@ -0,0 +1,13 @@ + + +ARM instruction "srs" wrong behaviour + +Quote from ARM Architecture Reference Manual ARMv7-A and ARMv7-R : +"Store Return State stores the LR and SPSR of the current mode to the stack of a specified mode" + +Problem: +When executing this instruction, the register stored is CPSR instead of SPSR. 
+ +Context: +Using QEMU 1.2.0 to simulate a Zynq application (processor Cortex-a9 mpcore) with the following command line: +qemu-system-arm -M xilinx-zynq-a9 -m 512 -serial null -serial mon:stdio -dtb /home/vcesson/workspace/xilinx_zynq.dtb -kernel install/tests/io/serial/current/tests/serial2 -S -s -nographic \ No newline at end of file diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1086 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1086 new file mode 100644 index 00000000..56d70a3b --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1086 @@ -0,0 +1,72 @@ + + + +Numpy/scipy test suites fails in QEMU on ppc64le (but not on aarch64) +Description of problem: +I'm not really qualified to report this problem, but after being affected by it for ~2 years (and QEMU 7 not fixing things), I decided to give it a shot. Please excuse reporting deficiencies, I'll endeavour to fix them as best I can once pointed out. + +In my spare time, I help out for the packaging effort in the [conda-forge](https://conda-forge.org/) ecosystem, which is mostly associated/attached to the python world, but - in contrast to the vanilla python tools - also deals with non-python dependencies, and in particular has strong enough abstractions to deal with ABI-issues and generally provides much better integration than the packages on PyPI. + +This strength of abstraction has also allowed conda-forge to publish artefacts for many more architectures than most projects are commonly able to provide precompiled binaries for. Due to the lack of (reliable) public CI for aarch64 & ppc64le, these packages are mostly cross-compiled from linux-x86. Where cross compilation is not possible, the packages are compiled in emulation through QEMU, coming through https://github.com/multiarch/qemu-user-static (this is the part of the infrastructure I don't fully understand myself...). 
The full infrastructure is somewhat involved, but should not be relevant (hopefully) to the issue at hand (see instructions below) - and even if that turns out to be the case, that would be a great information gain as well. + +In either case, the tests for the package (ideally comprising the entire upstream test suite) are then run in emulation. + +Two of the so-called "feedstocks" I co-maintain are for [numpy](https://github.com/conda-forge/numpy-feedstock) and [scipy](https://github.com/conda-forge/scipy-feedstock), and there have been persistent issues with running the test suite in emulation on PPC (interestingly, the same setup on a different architecture - aarch64 - has no problems). However, the compiled artefacts on PPC run fine on native hardware. + +Said otherwise, it appears numpy/scipy are exercising QEMU enough to uncover some bugs. I've seen similar problems also in other packages (e.g. the cvxpy-stack), reinforcing the impression that this is a QEMU issue, and not one on the level of the individual packages. 
+ +Depending on the exact combination of python version, the result of the numpy test suite might be as follows: +``` +320 failed, 18900 passed, 361 skipped, 36 xfailed, 9 xpassed, 144 warnings in 2516.49s (0:41:56) +``` + +Looking at the test failures, sometimes the results are garbage +``` +> assert_array_max_ulp(x, x+eps, maxulp=20) +E AssertionError: Arrays are not almost equal up to 20 ULP (max difference is 8.55554e+08 ULP) + +eps = 1.1920929e-07 +self = +x = array([ 2.3744986e-38, nan, 2.2482052e-15, 7.5780330e+28, + nan, nan, 5.8310814e+29, -5.6511531e+24, + 1.0010809e+00, 1.0101526e+00], dtype=float32) +``` +sometimes the values are permuted +``` +> assert_array_equal(actual, desired) +E AssertionError: +E Arrays are not equal +E +E x and y nan location mismatch: +E x: array([0.000000e+00, 6.704092e-39, 9.000000e+00, 2.350989e-38, +E 0.000000e+00, 0.000000e+00, 0.000000e+00, 0.000000e+00, +E 6.772341e-39, nan], dtype=float32) +E y: array([6.704092e-39, 6.772341e-39, 0.000000e+00, 0.000000e+00, +E 0.000000e+00, 0.000000e+00, nan, 2.350989e-38, +E 2.000000e+00, 7.000000e+00], dtype=float32) +``` +sometimes the results are fundamentally different (zero vs. non-zero) +``` +> raise AssertionError(msg) +E AssertionError: +E Arrays are not almost equal to 6 decimals +E +E Mismatched elements: 72 / 216 (33.3%) +E Max absolute difference: 1. +E Max relative difference: 1. +E x: array([[[[[0., 0., 0.], +E [0., 0., 0.], +E [0., 0., 0.]],... +E y: array([[[[[1., 0., 0.], +E [0., 1., 0.], +E [0., 0., 1.]],... +``` + +I don't know where it goes wrong, but it's not just a little tolerance violation. One PR that illustrates this is [here](https://github.com/conda-forge/numpy-feedstock/pull/274) and the respective CI run is [here](https://dev.azure.com/conda-forge/feedstock-builds/_build/results?buildId=526218&view=results) (ignore the errors for osx-arm64, those are unrelated). +Steps to reproduce: +1. 
In an emulated ppc64 machine, install miniforge from [here](https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-ppc64le.sh) +2. Run `conda create -n test_env numpy pytest cython hypothesis typing_extensions` and then `conda activate test_env` +3. Run `python -c "import numpy; numpy.test()"` +4. Pick any test that fails and run it as `python -c "import numpy; numpy.test(tests='x.y.z')"` +Additional information: + diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1092 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1092 new file mode 100644 index 00000000..60c305b4 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1092 @@ -0,0 +1,17 @@ + + + +PPC: `sraw` instructions does not set `ca` and `ca32` flags. +Description of problem: +The translation of Power PC instruction `sraw` and `sraw.` don't set the `ca` or `ca32` flags although, according to +[PowerISA 3.1b](https://files.openpower.foundation/s/dAYSdGzTfW4j2r2) (page 140), they should. +Additional information: +This gets particular apparent if compared to `srawi` (which does set `ca`, `ca32`). + +**sraw** + +https://gitlab.com/qemu-project/qemu/-/blob/master/target/ppc/translate.c#L2914 + +**srawi** + +https://gitlab.com/qemu-project/qemu/-/blob/master/target/ppc/translate.c#L2924 diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095531 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095531 new file mode 100644 index 00000000..0de5aed7 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095531 @@ -0,0 +1,60 @@ + + + +sparc32plus (and others?) has x86 code generation errors on 64bit hosts + +On 64bit hosts, the load and store functions compile improperly. The issue is the call to gen_address_mask() under the ld and st functions in target-sparc/translate.c. Below are some snips from the log file. 
Doing a gdb debug, this results in constant access violation errors which I do not see when debugging qemu in powerpc mode. + +-------------- +IN: +0x0000000040804aa8: st %i0, [ %fp + 0x44 ] + +OP: + ---- 0x40804aa8 + ld_i64 tmp1,regwptr,$0xb0 + mov_i64 tmp0,tmp1 + movi_i64 tmp2,$0x44 + add_i64 tmp0,tmp0,tmp2 + ld_i64 tmp2,regwptr,$0x80 + ext32u_i64 tmp0,tmp0 + qemu_st32 tmp2,tmp0,$0x0 + +OUT: [size=345] +0x6032d7f0: mov 0x40(%r14),%rbp +0x6032d7f4: mov 0xb0(%rbp),%rbx +0x6032d7fb: add $0x44,%rbx +0x6032d7ff: mov 0x80(%rbp),%rbp +0x6032d806: mov %ebx,%ebx <- bug +0x6032d808: mov %ebp,%edi +0x6032d80a: bswap %edi +0x6032d80c: mov %edi,(%rbx) + +-------------- +IN: +0x0000000040804aec: add %l7, %o7, %l7 +0x0000000040804af0: ld [ %l7 ], %g2 + +OP: + ---- 0x40804aec + ld_i64 tmp1,regwptr,$0x78 + ld_i64 tmp2,regwptr,$0x38 + add_i64 tmp0,tmp1,tmp2 + st_i64 tmp0,regwptr,$0x78 + + ---- 0x40804af0 + ld_i64 tmp1,regwptr,$0x78 + mov_i64 tmp0,tmp1 + ext32u_i64 tmp0,tmp0 + qemu_ld32u g2,tmp0,$0x0 + +OUT: [size=395] +0x6032da80: mov 0x40(%r14),%rbp +0x6032da84: mov 0x78(%rbp),%rbx +0x6032da88: mov 0x38(%rbp),%r12 +0x6032da8c: add %r12,%rbx +0x6032da8f: mov %rbx,0x78(%rbp) +0x6032da93: mov 0x78(%rbp),%rbx +0x6032da97: mov %ebx,%ebx <- bug +0x6032da99: mov (%rbx),%ebx + +In 64bit mode, doing a 32bit operation will result in the top 32bit's being zero'd. I attempted to simply disable the call to gen_address_mask() but that did not fix the issue and actually caused the sparc32plus I was testing to become unusable. 
\ No newline at end of file diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095857 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095857 new file mode 100644 index 00000000..c8282590 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1095857 @@ -0,0 +1,14 @@ + + + +incorrect handling of [r32] address (long mode) + +while executing in Long Mode (x86-64) instructions such as + +mov eax,[r15d] + +end up executing as + +mov eax,[r15] + +according to x86 programmer manuals the behavior of using the Address-Size override (in long mode) is supposed to ignore the high 32bits of the register. I use this fact in my operating system to reduce register usage (the high 32 bits of r15 holds other data). consequently a general protection exception occurs since the memory address isn't "canonical". this error doesn't always appear since the high 32 bits might not be zero in those conditions. \ No newline at end of file diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1128 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1128 new file mode 100644 index 00000000..902f0baf --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1128 @@ -0,0 +1,27 @@ + + + +PPC: `spr_write_xer` doesn't set flag bits in `cpu_xer` +Description of problem: +`spr_write_xer()` does not set the `ca`, `ov`, `so`, `ca32`, `ov32` etc. flag bits in the `cpu_xer` variable. + +In fact it copies all bits from the source `GPR` and _excludes_ each flag bit. + +This is not a problem for execution since `spr_read_xer()` gets the flag bits from `cpu_ca/ov/so...` and not from `cpu_xer`. + +Nonetheless it is problem for tools which trace the execution in QEMU (e.g. https://github.com/BinaryAnalysisPlatform/qemu). 
+ +A fix would be to remove the `~` in https://gitlab.com/qemu-project/qemu/-/blob/master/target/ppc/translate.c#L481 +Steps to reproduce: +Haven't found out yet how to debug QEMU so the TCGv values can be investigated. But in general one need to: + +- Execute a binary which executes something like: +``` +r4 = 0xffffffffffffffff +mtxer r4 +``` +and check the `cpu_xer` value after the `xer` write. + +Checking the debug logs (`in_asm,cpu`) doesn't work, since the `xer` value in the logs is not taken directly from `cpu_xer`. +Additional information: +Code ref: https://gitlab.com/qemu-project/qemu/-/blob/master/target/ppc/translate.c#L480-L483 diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1129571 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1129571 new file mode 100644 index 00000000..dc66da3b --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1129571 @@ -0,0 +1,17 @@ + + + +libreoffice armhf FTBFS + +We have been experiencing FTBFS of LibreOffice 3.5.7, 12.04, armhf in the launchpad buildds. We believe this is likely due to an error in qemu. + +While we do not have a small test case yet, we do have a build log (attaching here). 
+ +The relevant snippet from the build log is: + +3.5.7/solver/unxlngr.pro/bin/jaxp.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/juh.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/parser.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/xt.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/unoil.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/ridl.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/jurt.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/xmlsearch.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/LuceneHelpWrapper.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/HelpIndexerTool.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/lucene-core-2.3.jar:/build/buildd/libreoffice-3.5.7/solver/unxlngr.pro/bin/lucene-analyzers-2.3.jar" com.sun.star.help.HelpIndexerTool -lang cs -mod swriter -zipdir ../../unxlngr.pro/misc/ziptmpswriter_cs -o ../../unxlngr.pro/bin/swriter_cs.zip.unxlngr.pro +dmake: Error code 132, while making '../../unxlngr.pro/bin/swriter_cs.zip' + +We believe this is from bash error code 128 + 4, where 4 is illegal instruction, thus leading us to suspect qemu. + +Any help in tracking this down would be appreciated. 
\ No newline at end of file diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156 new file mode 100644 index 00000000..76296a60 --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156 @@ -0,0 +1,4 @@ + + + +Incorrect implementation of vmsumudm instruction diff --git a/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156313 b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156313 new file mode 100644 index 00000000..76a0b70e --- /dev/null +++ b/results/classifier/no-thinking-deepseek-r1:70b/output/instruction/1156313 @@ -0,0 +1,129 @@ + +semantic: 0.869 +mistranslation: 0.841 +assembly: 0.789 +device: 0.777 +instruction: 0.707 +other: 0.705 +vnc: 0.702 +graphic: 0.657 +socket: 0.605 +boot: 0.576 +network: 0.533 +KVM: 0.518 + +X86-64 flags handling broken + +The current qemu sources cause improper handling of flags on x86-64. +This bug seems to have shown up a few weeks ago. + +A plain install of Debian GNU/Linux makes user processes catch +spurious signals. The kernel seems to run stably, though. + +The ADX feature works very poorly. It might be related; at least it +allows for reproducibly provoking invalid behaviour. + +Here is a test case: + +================================================================ +qemumain.c +#include +long adx(); +int +main () +{ + printf ("%lx\n", adx (0xffbeef, 17)); + return 0; +} +================================================================ +qemuadx.s: + .globl adx +adx: xor %rax, %rax +1: dec %rdi + jnz 1b + .byte 0xf3, 0x48, 0x0f, 0x38, 0xf6, 0xc0 # adox %rax, %rax + .byte 0x66, 0x48, 0x0f, 0x38, 0xf6, 0xc0 # adcx %rax, %rax + ret +================================================================ + +Compile and execute: +$ gcc -m64 qemumain.c qemuadx.s +$ a.out +ffffff8000378cd8 + +Expected output is simply "0". 
The garbage value varies between qemu +compiles and guest systems. + +Note that one needs a recent GNU assembler in order to handle adox and +adcx. For convenience I have supplied them as byte sequences. + +Explanation and feeble analysis: + +The 0xffbeef argument is a loop count. It is necessary to loop for a +while in order to trigger this bug. If the loop count is decreased, +the bug will be seen intermittently; the lower the count, the less +frequent the invalid behaviour. + +It seems like a reasonable assumption that this bug is related to +flags handling at context switch. Presumably, qemu keeps flags state +in some internal format, then recomputes them when needing to form the +eflags register, as needed for example for context switching. + +I haven't tried to reproduce this bug using qemu-x86_64 and SYSROOT, +but I strongly suspect that to be impossible. I use +qemu-system-x86_64 and the guest Debian GNU/Linux x86_64 (version +6.0.6) . + +The bug happens also with the guest FreeBSD x86_64 version 9.1. (The +iteration count for triggering the problem 50% of the runs is not the +same when using the kernel Linux and FreeBSD's kernel, presumably due +to different ticks.) + +The bug happens much more frequently for a loaded system; in fact, the +loop count can be radically decreased if two instances of the trigger +program are run in parallel. + +Richard Henderson