why did I ever choose to do IB

This commit is contained in:
2025-04-29 23:10:24 -05:00
parent 3188a05c6a
commit cda8b28b7e
7 changed files with 706 additions and 79 deletions

View File

@@ -26,6 +26,13 @@
\abx@aux@segm{0}{0}{cobbe2021trainingverifierssolvemath}
\abx@aux@cite{0}{cobbe2021trainingverifierssolvemath}
\abx@aux@segm{0}{0}{cobbe2021trainingverifierssolvemath}
\abx@aux@read@bbl@mdfivesum{nohash}
\abx@aux@read@bblrerun
\gdef \@abspage@last{8}
\abx@aux@read@bbl@mdfivesum{DB874CC7E8DA7002F79589CE78CE1348}
\abx@aux@defaultrefcontext{0}{ahn2024largelanguagemodelsmathematical}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{cobbe2021trainingverifierssolvemath}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{hendrycks2021measuringmathematicalproblemsolving}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{hoffmann2022trainingcomputeoptimallargelanguage}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{ivanov2024}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{app14020744}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{vaswani2023attentionneed}{nty/global//global/global/global}
\abx@aux@defaultrefcontext{0}{Wang2024}{nty/global//global/global/global}
\gdef \@abspage@last{9}

650
EEMLA.bbl Normal file
View File

@@ -0,0 +1,650 @@
% $ biblatex auxiliary file $
% $ biblatex bbl format version 3.3 $
% Do not modify the above lines!
%
% This is an auxiliary file used by the 'biblatex' package.
% This file may safely be deleted. It will be recreated by
% biber as required.
%
\begingroup
\makeatletter
\@ifundefined{ver@biblatex.sty}
{\@latex@error
{Missing 'biblatex' package}
{The bibliography requires the 'biblatex' package.}
\aftergroup\endinput}
{}
\endgroup
\refsection{0}
\datalist[entry]{nty/global//global/global/global}
\entry{ahn2024largelanguagemodelsmathematical}{misc}{}{}
\name{author}{6}{}{%
{{un=0,uniquepart=base,hash=55b43626068d5d974748659fe7e69f14}{%
family={Ahn},
familyi={A\bibinitperiod},
given={Janice},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=203a45aabbe5b6981d4d994a6b800a64}{%
family={Verma},
familyi={V\bibinitperiod},
given={Rishu},
giveni={R\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=b5577bb26d2577f3382a51e640893655}{%
family={Lou},
familyi={L\bibinitperiod},
given={Renze},
giveni={R\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=b57a1b9e5665c3bf5033c8cfe0f7e3ca}{%
family={Liu},
familyi={L\bibinitperiod},
given={Di},
giveni={D\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=0672466dc7c3a8cec050e5ac091fd0ac}{%
family={Zhang},
familyi={Z\bibinitperiod},
given={Rui},
giveni={R\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=f04e25a79b81d6565c2d598e1fd5fa2e}{%
family={Yin},
familyi={Y\bibinitperiod},
given={Wenpeng},
giveni={W\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{db73145580b1257f9bbc80ac70bfb8af}
\strng{fullhash}{f4f3169ad9e4481309df17e741ebdcd5}
\strng{fullhashraw}{f4f3169ad9e4481309df17e741ebdcd5}
\strng{bibnamehash}{db73145580b1257f9bbc80ac70bfb8af}
\strng{authorbibnamehash}{db73145580b1257f9bbc80ac70bfb8af}
\strng{authornamehash}{db73145580b1257f9bbc80ac70bfb8af}
\strng{authorfullhash}{f4f3169ad9e4481309df17e741ebdcd5}
\strng{authorfullhashraw}{f4f3169ad9e4481309df17e741ebdcd5}
\field{sortinit}{A}
\field{sortinithash}{2f401846e2029bad6b3ecc16d50031e2}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.CL}
\field{eprinttype}{arXiv}
\field{title}{Large Language Models for Mathematical Reasoning: Progresses and Challenges}
\field{year}{2024}
\verb{eprint}
\verb 2402.00157
\endverb
\verb{urlraw}
\verb arxiv.org/abs/2402.00157
\endverb
\verb{url}
\verb arxiv.org/abs/2402.00157
\endverb
\endentry
\entry{cobbe2021trainingverifierssolvemath}{misc}{}{}
\name{author}{12}{}{%
{{un=0,uniquepart=base,hash=c9355eeb51a7665fc3d58f45e210fbf6}{%
family={Cobbe},
familyi={C\bibinitperiod},
given={Karl},
giveni={K\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=da0f106450b289c3010ca569b3de9949}{%
family={Kosaraju},
familyi={K\bibinitperiod},
given={Vineet},
giveni={V\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=69471b8ab1a1d92877d0dfe5f57411e3}{%
family={Bavarian},
familyi={B\bibinitperiod},
given={Mohammad},
giveni={M\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=fb15a691583ec94aafe0be6e7da4878f}{%
family={Chen},
familyi={C\bibinitperiod},
given={Mark},
giveni={M\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=3dd736ee38ff1cbcc6f0d05487b9950b}{%
family={Jun},
familyi={J\bibinitperiod},
given={Heewoo},
giveni={H\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=f2bc899b1160163417da7bf510f15d33}{%
family={Kaiser},
familyi={K\bibinitperiod},
given={Lukasz},
giveni={L\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=599240d5bfe42aeb65a0c26dae77cd31}{%
family={Plappert},
familyi={P\bibinitperiod},
given={Matthias},
giveni={M\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=98cbd7022a1c31a6293aa1c8b62bdebf}{%
family={Tworek},
familyi={T\bibinitperiod},
given={Jerry},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=9e4edc142b0564cbbb1cf93a401e4434}{%
family={Hilton},
familyi={H\bibinitperiod},
given={Jacob},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=13b885c1233d3f59261e0e53ec1aece0}{%
family={Nakano},
familyi={N\bibinitperiod},
given={Reiichiro},
giveni={R\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=68a04c5006dbbf98f7719709540c6b56}{%
family={Hesse},
familyi={H\bibinitperiod},
given={Christopher},
giveni={C\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=3e09bd2a25d237ebdaed560a07c0451e}{%
family={Schulman},
familyi={S\bibinitperiod},
given={John},
giveni={J\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{45858a0ae98644e6c6bc549ac1a2cfa3}
\strng{fullhash}{2b1c5987decdf5a17625aab169f4133e}
\strng{fullhashraw}{2b1c5987decdf5a17625aab169f4133e}
\strng{bibnamehash}{45858a0ae98644e6c6bc549ac1a2cfa3}
\strng{authorbibnamehash}{45858a0ae98644e6c6bc549ac1a2cfa3}
\strng{authornamehash}{45858a0ae98644e6c6bc549ac1a2cfa3}
\strng{authorfullhash}{2b1c5987decdf5a17625aab169f4133e}
\strng{authorfullhashraw}{2b1c5987decdf5a17625aab169f4133e}
\field{sortinit}{C}
\field{sortinithash}{4d103a86280481745c9c897c925753c0}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.LG}
\field{eprinttype}{arXiv}
\field{title}{Training Verifiers to Solve Math Word Problems}
\field{year}{2021}
\verb{eprint}
\verb 2110.14168
\endverb
\verb{urlraw}
\verb arxiv.org/abs/2110.14168
\endverb
\verb{url}
\verb arxiv.org/abs/2110.14168
\endverb
\endentry
\entry{hendrycks2021measuringmathematicalproblemsolving}{misc}{}{}
\name{author}{8}{}{%
{{un=0,uniquepart=base,hash=86d0b4ecd6b6066d49e7aecde6e5e630}{%
family={Hendrycks},
familyi={H\bibinitperiod},
given={Dan},
giveni={D\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=624605ebd8b6b403b251522e3d1029ff}{%
family={Burns},
familyi={B\bibinitperiod},
given={Collin},
giveni={C\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=ae50339c3e9c1418ade64e74fa002ef5}{%
family={Kadavath},
familyi={K\bibinitperiod},
given={Saurav},
giveni={S\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=a3e8b92acb1bf8b2b186f6b10d4ae704}{%
family={Arora},
familyi={A\bibinitperiod},
given={Akul},
giveni={A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=35f72302a7aebfd095414ce218b8fb5d}{%
family={Basart},
familyi={B\bibinitperiod},
given={Steven},
giveni={S\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=ffd1907ef0a8bbed89fa04d783f236b6}{%
family={Tang},
familyi={T\bibinitperiod},
given={Eric},
giveni={E\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=d458d5f9b64652055bd81d57e4777b22}{%
family={Song},
familyi={S\bibinitperiod},
given={Dawn},
giveni={D\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=fe7a7e80c1857d185d3ab01f15fe584d}{%
family={Steinhardt},
familyi={S\bibinitperiod},
given={Jacob},
giveni={J\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{f461c117afa272374439d2db3ee67282}
\strng{fullhash}{821f0c67ea3dbc37f0422b8c2bda174e}
\strng{fullhashraw}{821f0c67ea3dbc37f0422b8c2bda174e}
\strng{bibnamehash}{f461c117afa272374439d2db3ee67282}
\strng{authorbibnamehash}{f461c117afa272374439d2db3ee67282}
\strng{authornamehash}{f461c117afa272374439d2db3ee67282}
\strng{authorfullhash}{821f0c67ea3dbc37f0422b8c2bda174e}
\strng{authorfullhashraw}{821f0c67ea3dbc37f0422b8c2bda174e}
\field{sortinit}{H}
\field{sortinithash}{23a3aa7c24e56cfa16945d55545109b5}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.LG}
\field{eprinttype}{arXiv}
\field{title}{Measuring Mathematical Problem Solving With the MATH Dataset}
\field{year}{2021}
\verb{eprint}
\verb 2103.03874
\endverb
\verb{urlraw}
\verb arxiv.org/abs/2103.03874
\endverb
\verb{url}
\verb arxiv.org/abs/2103.03874
\endverb
\endentry
\entry{hoffmann2022trainingcomputeoptimallargelanguage}{misc}{}{}
\name{author}{22}{}{%
{{un=0,uniquepart=base,hash=92d226c4ea870c0e9df2ceb8bf03d8ff}{%
family={Hoffmann},
familyi={H\bibinitperiod},
given={Jordan},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=c28d74501d531d6672ccf4c28016c7ac}{%
family={Borgeaud},
familyi={B\bibinitperiod},
given={Sebastian},
giveni={S\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=e9a587c57b1dcb4834850800386d8aca}{%
family={Mensch},
familyi={M\bibinitperiod},
given={Arthur},
giveni={A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=eee8c4b85d5c4e1f4bc70218d34ba69d}{%
family={Buchatskaya},
familyi={B\bibinitperiod},
given={Elena},
giveni={E\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=3d7a83ed6eb983ca17cec804631dc22e}{%
family={Cai},
familyi={C\bibinitperiod},
given={Trevor},
giveni={T\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=5cc07c10e9f1ef5fae367662553d982c}{%
family={Rutherford},
familyi={R\bibinitperiod},
given={Eliza},
giveni={E\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=47f81e65396e1d91b7ab70d59f69329b}{%
family={Las\bibnamedelima Casas},
familyi={L\bibinitperiod\bibinitdelim C\bibinitperiod},
given={Diego},
giveni={D\bibinitperiod},
givenun=0,
prefix={de},
prefixi={d\bibinitperiod}}}%
{{un=0,uniquepart=base,hash=68b917d11d355ed641ee448751fb3ba5}{%
family={Hendricks},
familyi={H\bibinitperiod},
given={Lisa\bibnamedelima Anne},
giveni={L\bibinitperiod\bibinitdelim A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=7a7fdb4cb72d04e1eaa8a6a2ca0358dc}{%
family={Welbl},
familyi={W\bibinitperiod},
given={Johannes},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=b06242c53973106520ab19f8e1fc3799}{%
family={Clark},
familyi={C\bibinitperiod},
given={Aidan},
giveni={A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=0c1f2b1cf15f9e15216a9e652512bf6f}{%
family={Hennigan},
familyi={H\bibinitperiod},
given={Tom},
giveni={T\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=70b3914180795f8c87317cbd0599c942}{%
family={Noland},
familyi={N\bibinitperiod},
given={Eric},
giveni={E\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=da626c813aa81825001015989a23f850}{%
family={Millican},
familyi={M\bibinitperiod},
given={Katie},
giveni={K\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=54c5c572d4fdc5d822c240b59fcadad4}{%
family={Driessche},
familyi={D\bibinitperiod},
given={George},
giveni={G\bibinitperiod},
givenun=0,
prefix={van\bibnamedelima den},
prefixi={v\bibinitperiod\bibinitdelim d\bibinitperiod}}}%
{{un=0,uniquepart=base,hash=4da5c824138e58f9def8fd792b5ad94f}{%
family={Damoc},
familyi={D\bibinitperiod},
given={Bogdan},
giveni={B\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=8bc2c63cf1c4c6e9e4d317839dda4de2}{%
family={Guy},
familyi={G\bibinitperiod},
given={Aurelia},
giveni={A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=643f92e8f89f2746a4c1aa077d225755}{%
family={Osindero},
familyi={O\bibinitperiod},
given={Simon},
giveni={S\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=9d16b7284df92c9adaee86c37ab992df}{%
family={Simonyan},
familyi={S\bibinitperiod},
given={Karen},
giveni={K\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=6aa92a937d4d30dd0b5ec0eecbad1bf1}{%
family={Elsen},
familyi={E\bibinitperiod},
given={Erich},
giveni={E\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=8dcdeb16ef3c68cf8396226668804fe0}{%
family={Rae},
familyi={R\bibinitperiod},
given={Jack\bibnamedelima W.},
giveni={J\bibinitperiod\bibinitdelim W\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=494b568c5dc85ba8f3f409635f9c5f25}{%
family={Vinyals},
familyi={V\bibinitperiod},
given={Oriol},
giveni={O\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=50d24de916599d306c5cb1a77156e4b9}{%
family={Sifre},
familyi={S\bibinitperiod},
given={Laurent},
giveni={L\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{8be79936575bb0d5b77c96da6d2a6d52}
\strng{fullhash}{fb6d92421541c28738787855a47da527}
\strng{fullhashraw}{fb6d92421541c28738787855a47da527}
\strng{bibnamehash}{8be79936575bb0d5b77c96da6d2a6d52}
\strng{authorbibnamehash}{8be79936575bb0d5b77c96da6d2a6d52}
\strng{authornamehash}{8be79936575bb0d5b77c96da6d2a6d52}
\strng{authorfullhash}{fb6d92421541c28738787855a47da527}
\strng{authorfullhashraw}{fb6d92421541c28738787855a47da527}
\field{sortinit}{H}
\field{sortinithash}{23a3aa7c24e56cfa16945d55545109b5}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.CL}
\field{eprinttype}{arXiv}
\field{title}{Training Compute-Optimal Large Language Models}
\field{year}{2022}
\verb{eprint}
\verb 2203.15556
\endverb
\verb{urlraw}
\verb arxiv.org/abs/2203.15556
\endverb
\verb{url}
\verb arxiv.org/abs/2203.15556
\endverb
\endentry
\entry{ivanov2024}{misc}{}{}
\name{author}{2}{}{%
{{un=0,uniquepart=base,hash=1935b6f0043d4bac823842ff5d478faf}{%
family={Ivanov},
familyi={I\bibinitperiod},
given={Todor},
giveni={T\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=495d2036e580863cb79ad80a7bb2fc78}{%
family={Penchev},
familyi={P\bibinitperiod},
given={Valeri},
giveni={V\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{259e51507bbcab245b7267c088c1998f}
\strng{fullhash}{259e51507bbcab245b7267c088c1998f}
\strng{fullhashraw}{259e51507bbcab245b7267c088c1998f}
\strng{bibnamehash}{259e51507bbcab245b7267c088c1998f}
\strng{authorbibnamehash}{259e51507bbcab245b7267c088c1998f}
\strng{authornamehash}{259e51507bbcab245b7267c088c1998f}
\strng{authorfullhash}{259e51507bbcab245b7267c088c1998f}
\strng{authorfullhashraw}{259e51507bbcab245b7267c088c1998f}
\field{sortinit}{I}
\field{sortinithash}{8d291c51ee89b6cd86bf5379f0b151d8}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.DC}
\field{eprinttype}{arXiv}
\field{title}{AI Benchmarks and Datasets for LLM Evaluation}
\field{year}{2024}
\verb{eprint}
\verb 2412.01020
\endverb
\verb{urlraw}
\verb arxiv.org/abs/2412.01020
\endverb
\verb{url}
\verb arxiv.org/abs/2412.01020
\endverb
\endentry
\entry{app14020744}{article}{}{}
\name{author}{1}{}{%
{{un=0,uniquepart=base,hash=d8c43e5429158fe51408ffa847a4a856}{%
family={Testolin},
familyi={T\bibinitperiod},
given={Alberto},
giveni={A\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{d8c43e5429158fe51408ffa847a4a856}
\strng{fullhash}{d8c43e5429158fe51408ffa847a4a856}
\strng{fullhashraw}{d8c43e5429158fe51408ffa847a4a856}
\strng{bibnamehash}{d8c43e5429158fe51408ffa847a4a856}
\strng{authorbibnamehash}{d8c43e5429158fe51408ffa847a4a856}
\strng{authornamehash}{d8c43e5429158fe51408ffa847a4a856}
\strng{authorfullhash}{d8c43e5429158fe51408ffa847a4a856}
\strng{authorfullhashraw}{d8c43e5429158fe51408ffa847a4a856}
\field{sortinit}{T}
\field{sortinithash}{9af77f0292593c26bde9a56e688eaee9}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{abstract}{Creating learning models that can exhibit sophisticated reasoning abilities is one of the greatest challenges in deep learning research, and mathematics is rapidly becoming one of the target domains for assessing scientific progress in this direction. In the past few years there has been an explosion of neural network architectures, datasets, and benchmarks specifically designed to tackle mathematical problems, reporting impressive achievements in disparate fields such as automated theorem proving, numerical integration, and the discovery of new conjectures or matrix multiplication algorithms. However, despite this notable success it is still unclear whether deep learning models possess an elementary understanding of quantities and numbers. This survey critically examines the recent literature, concluding that even state-of-the-art architectures and large language models often fall short when probed with relatively simple tasks designed to test basic numerical and arithmetic knowledge.}
\field{issn}{2076-3417}
\field{journaltitle}{Applied Sciences}
\field{number}{2}
\field{title}{Can Neural Networks Do Arithmetic? A Survey on the Elementary Numerical Skills of State-of-the-Art Deep Learning Models}
\field{volume}{14}
\field{year}{2024}
\verb{doi}
\verb 10.3390/app14020744
\endverb
\endentry
\entry{vaswani2023attentionneed}{misc}{}{}
\name{author}{8}{}{%
{{un=0,uniquepart=base,hash=7f28e84700536646dd6620a0db07ad09}{%
family={Vaswani},
familyi={V\bibinitperiod},
given={Ashish},
giveni={A\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=62efade83d70f0323fe248755e6c90c5}{%
family={Shazeer},
familyi={S\bibinitperiod},
given={Noam},
giveni={N\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=06649ebab1ea5cac0250746a19764975}{%
family={Parmar},
familyi={P\bibinitperiod},
given={Niki},
giveni={N\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=831027ee0ebf22375e2a86afc1881909}{%
family={Uszkoreit},
familyi={U\bibinitperiod},
given={Jakob},
giveni={J\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=2fd2982e30ebcec93ec1cf76e0d797fd}{%
family={Jones},
familyi={J\bibinitperiod},
given={Llion},
giveni={L\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=27b07e4eacbf4ef7a1438e3badb7dd8d}{%
family={Gomez},
familyi={G\bibinitperiod},
given={Aidan\bibnamedelima N.},
giveni={A\bibinitperiod\bibinitdelim N\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=f2bc899b1160163417da7bf510f15d33}{%
family={Kaiser},
familyi={K\bibinitperiod},
given={Lukasz},
giveni={L\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=95595a0fefb86187cbc36e551017d332}{%
family={Polosukhin},
familyi={P\bibinitperiod},
given={Illia},
giveni={I\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{ee273ab30cfb889666f8c4d806eb9ce7}
\strng{fullhash}{f82970bbd2bdd7a002d2af62b743d5cc}
\strng{fullhashraw}{f82970bbd2bdd7a002d2af62b743d5cc}
\strng{bibnamehash}{ee273ab30cfb889666f8c4d806eb9ce7}
\strng{authorbibnamehash}{ee273ab30cfb889666f8c4d806eb9ce7}
\strng{authornamehash}{ee273ab30cfb889666f8c4d806eb9ce7}
\strng{authorfullhash}{f82970bbd2bdd7a002d2af62b743d5cc}
\strng{authorfullhashraw}{f82970bbd2bdd7a002d2af62b743d5cc}
\field{sortinit}{V}
\field{sortinithash}{afb52128e5b4dc4b843768c0113d673b}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{eprintclass}{cs.CL}
\field{eprinttype}{arXiv}
\field{title}{Attention Is All You Need}
\field{year}{2023}
\verb{eprint}
\verb 1706.03762
\endverb
\verb{urlraw}
\verb arxiv.org/abs/1706.03762
\endverb
\verb{url}
\verb arxiv.org/abs/1706.03762
\endverb
\endentry
\entry{Wang2024}{article}{}{}
\name{author}{6}{}{%
{{un=0,uniquepart=base,hash=7cca10cee48e9c197439e4af610acfe5}{%
family={Wang},
familyi={W\bibinitperiod},
given={Zichong},
giveni={Z\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=bc41c1f771e246b6d8ce744badb182e3}{%
family={Chu},
familyi={C\bibinitperiod},
given={Zhibo},
giveni={Z\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=82b0035db67db8bd400c34e8a5eec07b}{%
family={Doan},
familyi={D\bibinitperiod},
given={Thang\bibnamedelima Viet},
giveni={T\bibinitperiod\bibinitdelim V\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=852b650254c75a15c1024df13b29189c}{%
family={Ni},
familyi={N\bibinitperiod},
given={Shiwen},
giveni={S\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=feb96ca112c179e320db2db693e022b8}{%
family={Yang},
familyi={Y\bibinitperiod},
given={Min},
giveni={M\bibinitperiod},
givenun=0}}%
{{un=0,uniquepart=base,hash=dd4baede28b306ab6d37dd79d89a935b}{%
family={Zhang},
familyi={Z\bibinitperiod},
given={Wenbin},
giveni={W\bibinitperiod},
givenun=0}}%
}
\strng{namehash}{1c3e58e991d8f7a6ae5aee1e95c5cd8a}
\strng{fullhash}{391aec39c1c26e8d5e7517c1ab227456}
\strng{fullhashraw}{391aec39c1c26e8d5e7517c1ab227456}
\strng{bibnamehash}{1c3e58e991d8f7a6ae5aee1e95c5cd8a}
\strng{authorbibnamehash}{1c3e58e991d8f7a6ae5aee1e95c5cd8a}
\strng{authornamehash}{1c3e58e991d8f7a6ae5aee1e95c5cd8a}
\strng{authorfullhash}{391aec39c1c26e8d5e7517c1ab227456}
\strng{authorfullhashraw}{391aec39c1c26e8d5e7517c1ab227456}
\field{sortinit}{W}
\field{sortinithash}{4315d78024d0cea9b57a0c6f0e35ed0d}
\true{singletitle}
\field{labelnamesource}{author}
\field{labeltitlesource}{title}
\field{journaltitle}{AI and Ethics}
\field{month}{10}
\field{title}{History, development, and principles of large language models: An introductory survey}
\field{year}{2024}
\verb{doi}
\verb 10.1007/s43681-024-00583-7
\endverb
\endentry
\enddatalist
\endrefsection
\endinput

View File

@@ -1,5 +1,17 @@
[0] Config.pm:308> INFO - This is Biber 2.20
[0] Config.pm:311> INFO - Logfile is 'EEMLA.blg'
[39] biber:340> INFO - === Tue Apr 29, 2025, 22:30:03
[47] Utils.pm:410> ERROR - EEMLA.bcf is malformed, last biblatex run probably failed. Deleted EEMLA.bbl
[47] Biber.pm:136> INFO - ERRORS: 1
[38] biber:340> INFO - === Tue Apr 29, 2025, 23:04:30
[46] Biber.pm:420> INFO - Reading 'EEMLA.bcf'
[81] Biber.pm:994> INFO - Found 8 citekeys in bib section 0
[89] Biber.pm:4463> INFO - Processing section 0
[93] Biber.pm:4654> INFO - Looking for bibtex file 'references.bib' for section 0
[94] bibtex.pm:1713> INFO - LaTeX decoding ...
[97] bibtex.pm:1519> INFO - Found BibTeX data source 'references.bib'
[171] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'normalization = NFD' with 'normalization = prenormalized'
[171] UCollate.pm:68> INFO - Overriding locale 'en-US' defaults 'variable = shifted' with 'variable = non-ignorable'
[171] Biber.pm:4283> INFO - Sorting list 'nty/global//global/global/global' of type 'entry' with template 'nty' and locale 'en-US'
[171] Biber.pm:4289> INFO - No sort tailoring available for locale 'en-US'
[177] bbl.pm:676> INFO - Writing 'EEMLA.bbl' with encoding 'UTF-8'
[181] bbl.pm:779> INFO - Output to EEMLA.bbl
[181] Biber.pm:131> WARN - legacy month field 'Oct' in entry 'Wang2024' is not an integer - this will probably not sort properly.
[181] Biber.pm:133> INFO - WARNINGS: 1

View File

@@ -1,4 +1,4 @@
This is pdfTeX, Version 3.141592653-2.6-1.40.27 (TeX Live 2026/dev/Arch Linux) (preloaded format=pdflatex 2025.4.29) 29 APR 2025 22:30
This is pdfTeX, Version 3.141592653-2.6-1.40.27 (TeX Live 2026/dev/Arch Linux) (preloaded format=pdflatex 2025.4.29) 29 APR 2025 23:04
entering extended mode
restricted \write18 enabled.
%&-line parsing enabled.
@@ -556,11 +556,11 @@ Package biblatex Info: Automatic encoding selection.
\openout3 = `EEMLA.bcf'.
Package biblatex Info: Trying to load bibliographic data...
Package biblatex Info: ... file 'EEMLA.bbl' not found.
No file EEMLA.bbl.
Package biblatex Info: ... file 'EEMLA.bbl' found.
(./EEMLA.bbl)
Package biblatex Info: Reference section=0 on input line 57.
Package biblatex Info: Reference segment=0 on input line 57.
(/usr/share/texmf-dist/tex/context/base/mkii/supp-pdf.mkii
[Loading MPS to PDF converter (version 2006.09.02).]
\scratchcounter=\count418
@@ -595,10 +595,6 @@ File: epstopdf-sys.cfg 2010/07/13 v1.3 Configuration of (r)epstopdf for TeX Liv
e
))
LaTeX Warning: Citation 'app14020744' on page 1 undefined on input line 80.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -611,17 +607,6 @@ ts/enc/dvips/base/8r.enc}
]
LaTeX Warning: Citation 'Wang2024' on page 2 undefined on input line 90.
LaTeX Warning: Citation 'vaswani2023attentionneed' on page 2 undefined on input
line 90.
LaTeX Warning: Citation 'Wang2024' on page 2 undefined on input line 92.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -631,13 +616,6 @@ Package fancyhdr Warning: \headheight is too small (12.0pt):
[2]
LaTeX Warning: Citation 'ivanov2024' on page 3 undefined on input line 104.
LaTeX Warning: Citation 'ivanov2024' on page 3 undefined on input line 104.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -647,15 +625,6 @@ Package fancyhdr Warning: \headheight is too small (12.0pt):
[3]
LaTeX Warning: Citation 'hoffmann2022trainingcomputeoptimallargelanguage' on pa
ge 4 undefined on input line 106.
LaTeX Warning: Citation 'hoffmann2022trainingcomputeoptimallargelanguage' on pa
ge 4 undefined on input line 106.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -665,11 +634,6 @@ Package fancyhdr Warning: \headheight is too small (12.0pt):
[4]
LaTeX Warning: Citation 'hendrycks2021measuringmathematicalproblemsolving' on p
age 5 undefined on input line 139.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -684,19 +648,6 @@ LaTeX Font Info: Trying to load font information for TS1+ptm on input line 1
File: ts1ptm.fd 2001/06/04 font definitions for TS1/ptm.
)
LaTeX Warning: Citation 'ahn2024largelanguagemodelsmathematical' on page 6 unde
fined on input line 162.
LaTeX Warning: Citation 'cobbe2021trainingverifierssolvemath' on page 6 undefin
ed on input line 162.
LaTeX Warning: Citation 'cobbe2021trainingverifierssolvemath' on page 6 undefin
ed on input line 162.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
@@ -715,6 +666,11 @@ l.167 ...athbb{R}^{n \times d} \rightarrow \mathbb
{R}^{n \times d} \text{ su...
?
! Undefined control sequence.
l.178 ...input matrix. Here, $\mathbf{X}\in\mathbb
{R}^{n\times d}$ represent...
?
@@ -726,9 +682,14 @@ Package fancyhdr Warning: \headheight is too small (12.0pt):
[7]
LaTeX Warning: Empty bibliography on input line 186.
Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) Make it at least 14.49998pt, for example:
(fancyhdr) \setlength{\headheight}{14.49998pt}.
(fancyhdr) You might also make \topmargin smaller:
(fancyhdr) \addtolength{\topmargin}{-2.49998pt}.
[8]
Package fancyhdr Warning: \headheight is too small (12.0pt):
@@ -737,29 +698,20 @@ Package fancyhdr Warning: \headheight is too small (12.0pt):
(fancyhdr) You might also make \topmargin smaller:
(fancyhdr) \addtolength{\topmargin}{-2.49998pt}.
[8] (./EEMLA.aux)
[9] (./EEMLA.aux)
***********
LaTeX2e <2024-11-01> patch level 2
L3 programming layer <2025-01-18>
***********
LaTeX Warning: There were undefined references.
Package biblatex Warning: Please (re)run Biber on the file:
(biblatex) EEMLA
(biblatex) and rerun LaTeX afterwards.
Package logreq Info: Writing requests to 'EEMLA.run.xml'.
\openout1 = `EEMLA.run.xml'.
)
Here is how much of TeX's memory you used:
12030 strings out of 475171
224647 string characters out of 5767095
1112573 words of memory out of 5000000
34895 multiletter control sequences out of 15000+600000
12113 strings out of 475171
228166 string characters out of 5767095
1112870 words of memory out of 5000000
34976 multiletter control sequences out of 15000+600000
571519 words of font info for 64 fonts, out of 8000000 for 9000
14 hyphenation exceptions out of 8191
72i,18n,81p,1320b,2647s stack positions out of 10000i,1000n,20000p,200000b,200000s
@@ -772,10 +724,10 @@ hare/texmf-dist/fonts/type1/public/amsfonts/cm/cmsy10.pfb></usr/share/texmf-dis
t/fonts/type1/public/amsfonts/cm/cmsy8.pfb></usr/share/texmf-dist/fonts/type1/u
rw/times/utmb8a.pfb></usr/share/texmf-dist/fonts/type1/urw/times/utmr8a.pfb></u
sr/share/texmf-dist/fonts/type1/urw/times/utmri8a.pfb>
Output written on EEMLA.pdf (8 pages, 131155 bytes).
Output written on EEMLA.pdf (9 pages, 134566 bytes).
PDF statistics:
87 PDF objects out of 1000 (max. 8388607)
54 compressed objects within 1 object stream
90 PDF objects out of 1000 (max. 8388607)
56 compressed objects within 1 object stream
0 named destinations out of 1000 (max. 500000)
1 words of extra memory for PDF output out of 10000 (max. 10000000)

BIN
EEMLA.pdf

Binary file not shown.

View File

@@ -41,7 +41,7 @@
>
]>
<requests version="1.0">
<internal package="biblatex" priority="9" active="1">
<internal package="biblatex" priority="9" active="0">
<generic>latex</generic>
<provides type="dynamic">
<file>EEMLA.bcf</file>
@@ -64,7 +64,7 @@
<file>english-mla.lbx</file>
</requires>
</internal>
<external package="biblatex" priority="5" active="1">
<external package="biblatex" priority="5" active="0">
<generic>biber</generic>
<cmdline>
<binary>biber</binary>

View File

@@ -175,6 +175,12 @@ $$
\end{aligned}
$$
In the above example formulation of a fixed-index mutator function coupled with a self-attention layer for filtering noise from higher-confidence inputs, specific transformations are applied at specific indices of the input matrix. Here, $\mathbf{X}\in\mathbb{R}^{n\times d}$ represents the input tensor for a given layer, and $d$ is the embedding dimensionality. The function $\mathcal{R}$ applies specific, discontinuous logic based on identified patterns of the input located at specific indices. The mutated embedding is then processed through the standard attention mechanism to produce the output representation $\mathbf{Z}$. This output is then concatenated with the parallel layer(s) of the original neural network, allowing for an expansion of the network's capacity for operations without compromising the original token-based throughput.
{\raggedright \normalsize \textit{Location-Based Rule Selection}}
A critical aspect of the methodology is the mechanism responsible for determining which rule is applicable at each position within the input matrix $\mathbf{X}$. Rather than relying on stochastic selection, this approach implements a deterministic, location-based rule selection strategy that leverages the contextual information encoded within the model's representations. A major advantage of this fixed-index approach is the minimization of dynamic surfaces in the model's cost function, thereby reducing the amount of noise in the output as well as the amount of training required, since overfitting is a non-issue without randomness.
%%%%Works cited
\newpage