<?xml version='1.0' encoding='utf-8'?>
<root><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>1</segment><segment>Global</segment><segment>Research</segment><segment>journal</segment><segment>of</segment><segment>Natural</segment><segment>Science</segment><segment>&amp;</segment><segment>Technology</segment><segment>(GRJNST)</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026),</segment><segment>2076</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>ISSN</segment><segment>E:</segment><segment>2790-7651</segment><segment>www.grjnst.net</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>AuthStateBench:</segment><segment>A</segment><segment>Standards-Aligned</segment><segment>Benchmark</segment><segment>for</segment><segment>Stateful</segment><segment>Authorization</segment><segment>and</segment><segment>Authentication</segment><segment>Workflows</segment><segment>Received:</segment><segment>01</segment><segment>April</segment><segment>2026.</segment><segment>Accepted:</segment><segment>23</segment><segment>April</segment><segment>2026.</segment><segment>Published:</segment><segment>29</segment><segment>April</segment><segment>2026</segment><segment>Muhammad</segment><segment>Shahzad</segment><segment>Khadim</segment><segment>(Corresponding</segment><segment>Author)</segment><segment>Kohat</segment><segment>University</segment><segment>of</segment><segment>Science</segment><segment>and</segment><segment>Technology,</segment><segment>Kohat,</segment><segment>Pakistan</segment><segment>ytshahzad257@gmail.com</segment><segment>Syed</segment><segment>Mufassir</segment><segment>Shah</segment><segment>Kohat</segment><segment>University</segment><segment>of</segment><segment>Science</segment><segment>and</segment><segment>Technology,</segment><segment>Kohat,</segment><segment>Pakistan</segment><segment>mufassirshah3@gmail.com</segment><segment>Zubair</segment><segment>Khan</segment><segment>International</segment><segment>Islamic</segment><segment>University</segment><segment>Islamabad</segment><segment>Islamabad,</segment><segment>Pakistan</segment><segment>zubairafridi2312@gmail.com</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Copyright</segment><segment>©</segment><segment>2026</segment><segment>GRJNST.</segment><segment>This</segment><segment>article</segment><segment>is</segment><segment>published</segment><segment>under</segment><segment>an</segment><segment>Open</segment><segment>Access</segment><segment>model.</segment><segment>It</segment><segment>is</segment><segment>made</segment><segment>available</segment><segment>to</segment><segment>the</segment><segment>public</segment><segment>under</segment><segment>the</segment><segment>terms</segment><segment>of</segment><segment>the</segment><segment>Creative</segment><segment>Commons</segment><segment>Attribution</segment><segment>4.0</segment><segment>International</segment><segment>(CC</segment><segment>BY</segment><segment>4.0)</segment><segment>license,</segment><segment>which</segment><segment>permits</segment><segment>unrestricted</segment><segment>use</segment><segment>and</segment><segment>distribution</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>2</segment><segment>Abstract</segment><segment>Authentication</segment><segment>and</segment><segment>authorization</segment><segment>weaknesses</segment><segment>in</segment><segment>modern</segment><segment>web</segment><segment>applications</segment><segment>rarely</segment><segment>arise</segment><segment>as</segment><segment>isolated</segment><segment>request-level</segment><segment>defects.</segment><segment>They</segment><segment>often</segment><segment>depend</segment><segment>on</segment><segment>role</segment><segment>changes,</segment><segment>session</segment><segment>lifecycle</segment><segment>conditions,</segment><segment>object</segment><segment>ownership</segment><segment>boundaries,</segment><segment>API</segment><segment>authorization</segment><segment>rules,</segment><segment>and</segment><segment>business</segment><segment>workflow</segment><segment>ordering.</segment><segment>Existing</segment><segment>vulnerability</segment><segment>benchmarks</segment><segment>and</segment><segment>scanner</segment><segment>evaluations</segment><segment>remain</segment><segment>valuable,</segment><segment>but</segment><segment>they</segment><segment>often</segment><segment>represent</segment><segment>weaknesses</segment><segment>as</segment><segment>code-level</segment><segment>or</segment><segment>input-output</segment><segment>defects</segment><segment>and</segment><segment>therefore</segment><segment>underrepresent</segment><segment>semantic</segment><segment>failures</segment><segment>such</segment><segment>as</segment><segment>IDOR/BOLA,</segment><segment>function-level</segment><segment>authorization</segment><segment>bypass,</segment><segment>stale-session</segment><segment>reuse,</segment><segment>tenant-</segment><segment>boundary</segment><segment>violation,</segment><segment>privilege</segment><segment>transition</segment><segment>errors,</segment><segment>and</segment><segment>workflow</segment><segment>bypass.</segment><segment>This</segment><segment>article</segment><segment>introduces</segment><segment>AuthStateBench,</segment><segment>a</segment><segment>standards-aligned</segment><segment>benchmark</segment><segment>design</segment><segment>for</segment><segment>modeling</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>vulnerabilities</segment><segment>in</segment><segment>web</segment><segment>applications</segment><segment>and</segment><segment>APIs.</segment><segment>The</segment><segment>study</segment><segment>uses</segment><segment>a</segment><segment>structured</segment><segment>literature-based</segment><segment>and</segment><segment>standards-</segment><segment>mapping</segment><segment>methodology</segment><segment>that</segment><segment>draws</segment><segment>on</segment><segment>access-control</segment><segment>testing</segment><segment>research,</segment><segment>stateful</segment><segment>web</segment><segment>testing,</segment><segment>web</segment><segment>logic</segment><segment>flaw</segment><segment>analysis,</segment><segment>scanner-evaluation</segment><segment>studies,</segment><segment>vulnerability</segment><segment>benchmark</segment><segment>literature,</segment><segment>AI-assisted</segment><segment>vulnerability-analysis</segment><segment>work,</segment><segment>and</segment><segment>major</segment><segment>security</segment><segment>guidance</segment><segment>including</segment><segment>OWASP</segment><segment>Top</segment><segment>10,</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10,</segment><segment>OWASP</segment><segment>ASVS,</segment><segment>OWASP</segment><segment>WSTG,</segment><segment>NIST</segment><segment>SSDF,</segment><segment>MITRE</segment><segment>CWE,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design,</segment><segment>OAuth</segment><segment>2.0</segment><segment>security</segment><segment>guidance,</segment><segment>OpenID</segment><segment>Connect,</segment><segment>and</segment><segment>software-assurance</segment><segment>benchmark</segment><segment>resources.</segment><segment>AuthStateBench</segment><segment>contributes</segment><segment>a</segment><segment>four-dimensional</segment><segment>state</segment><segment>model</segment><segment>built</segment><segment>around</segment><segment>role</segment><segment>state,</segment><segment>session</segment><segment>state,</segment><segment>object-ownership</segment><segment>state,</segment><segment>and</segment><segment>workflow</segment><segment>state;</segment><segment>a</segment><segment>scenario</segment><segment>taxonomy;</segment><segment>a</segment><segment>benchmark</segment><segment>scenario</segment><segment>template;</segment><segment>standards-mapping</segment><segment>logic;</segment><segment>formal</segment><segment>scenario</segment><segment>and</segment><segment>coverage</segment><segment>equations;</segment><segment>and</segment><segment>comparison</segment><segment>criteria</segment><segment>for</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>AI-</segment><segment>assisted,</segment><segment>and</segment><segment>standards-based</segment><segment>assessment.</segment><segment>The</segment><segment>article</segment><segment>does</segment><segment>not</segment><segment>claim</segment><segment>empirical</segment><segment>detection</segment><segment>accuracy,</segment><segment>tool</segment><segment>execution,</segment><segment>live-system</segment><segment>testing,</segment><segment>or</segment><segment>dataset</segment><segment>results.</segment><segment>Instead,</segment><segment>it</segment><segment>provides</segment><segment>a</segment><segment>reproducible</segment><segment>design</segment><segment>artifact</segment><segment>and</segment><segment>validation</segment><segment>roadmap</segment><segment>for</segment><segment>future</segment><segment>controlled</segment><segment>implementation</segment><segment>and</segment><segment>comparative</segment><segment>evaluation.</segment><segment>Keywords:</segment><segment>Web</segment><segment>application</segment><segment>security;</segment><segment>broken</segment><segment>access</segment><segment>control;</segment><segment>authentication</segment><segment>workflow;</segment><segment>authorization</segment><segment>testing;</segment><segment>benchmark</segment><segment>design;</segment><segment>stateful</segment><segment>security</segment><segment>testing</segment><segment>1.</segment><segment>Introduction</segment><segment>1.1</segment><segment>Background</segment><segment>Modern</segment><segment>web</segment><segment>applications</segment><segment>rarely</segment><segment>fail</segment><segment>through</segment><segment>a</segment><segment>single</segment><segment>isolated</segment><segment>defect.</segment><segment>Their</segment><segment>security</segment><segment>posture</segment><segment>emerges</segment><segment>from</segment><segment>the</segment><segment>interaction</segment><segment>of</segment><segment>identity</segment><segment>providers,</segment><segment>session</segment><segment>stores,</segment><segment>API</segment><segment>gateways,</segment><segment>access-</segment><segment>control</segment><segment>middleware,</segment><segment>object-level</segment><segment>permission</segment><segment>checks,</segment><segment>business</segment><segment>workflows,</segment><segment>audit</segment><segment>mechanisms,</segment><segment>and</segment><segment>recovery</segment><segment>logic.</segment><segment>A</segment><segment>request</segment><segment>that</segment><segment>appears</segment><segment>harmless</segment><segment>in</segment><segment>isolation</segment><segment>may</segment><segment>become</segment><segment>dangerous</segment><segment>when</segment><segment>it</segment><segment>is</segment><segment>executed</segment><segment>with</segment><segment>the</segment><segment>wrong</segment><segment>role,</segment><segment>a</segment><segment>stale</segment><segment>session,</segment><segment>an</segment><segment>unowned</segment><segment>object</segment><segment>identifier,</segment><segment>or</segment><segment>a</segment><segment>skipped</segment><segment>workflow</segment><segment>step.</segment><segment>This</segment><segment>stateful</segment><segment>character</segment><segment>is</segment><segment>especially</segment><segment>visible</segment><segment>in</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>flaws.</segment><segment>A</segment><segment>user</segment><segment>may</segment><segment>be</segment><segment>authenticated</segment><segment>but</segment><segment>still</segment><segment>unauthorized</segment><segment>to</segment><segment>perform</segment><segment>a</segment><segment>function;</segment><segment>an</segment><segment>expired</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>3</segment><segment>token</segment><segment>may</segment><segment>be</segment><segment>accepted</segment><segment>after</segment><segment>logout;</segment><segment>an</segment><segment>object</segment><segment>identifier</segment><segment>may</segment><segment>expose</segment><segment>another</segment><segment>user's</segment><segment>record;</segment><segment>or</segment><segment>a</segment><segment>workflow</segment><segment>endpoint</segment><segment>may</segment><segment>allow</segment><segment>an</segment><segment>operation</segment><segment>before</segment><segment>the</segment><segment>required</segment><segment>approval</segment><segment>state</segment><segment>has</segment><segment>been</segment><segment>reached.</segment><segment>The</segment><segment>current</segment><segment>application-security</segment><segment>landscape</segment><segment>confirms</segment><segment>the</segment><segment>importance</segment><segment>of</segment><segment>this</segment><segment>problem.</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025</segment><segment>identifies</segment><segment>Broken</segment><segment>Access</segment><segment>Control</segment><segment>as</segment><segment>the</segment><segment>leading</segment><segment>web</segment><segment>application</segment><segment>security</segment><segment>risk,</segment><segment>and</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10:2023</segment><segment>places</segment><segment>Broken</segment><segment>Object</segment><segment>Level</segment><segment>Authorization</segment><segment>at</segment><segment>the</segment><segment>first</segment><segment>position</segment><segment>for</segment><segment>API</segment><segment>security</segment><segment>risk</segment><segment>[1]-[4].</segment><segment>OWASP</segment><segment>ASVS</segment><segment>5.0.0</segment><segment>and</segment><segment>the</segment><segment>OWASP</segment><segment>Web</segment><segment>Security</segment><segment>Testing</segment><segment>Guide</segment><segment>provide</segment><segment>deeper</segment><segment>verification</segment><segment>and</segment><segment>testing</segment><segment>guidance</segment><segment>for</segment><segment>authentication,</segment><segment>session</segment><segment>management,</segment><segment>access</segment><segment>control,</segment><segment>API</segment><segment>behavior,</segment><segment>and</segment><segment>business</segment><segment>logic</segment><segment>[5],</segment><segment>[6].</segment><segment>NIST</segment><segment>SSDF</segment><segment>and</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>guidance</segment><segment>frame</segment><segment>these</segment><segment>weaknesses</segment><segment>as</segment><segment>secure-development</segment><segment>and</segment><segment>product-</segment><segment>responsibility</segment><segment>concerns</segment><segment>rather</segment><segment>than</segment><segment>isolated</segment><segment>testing</segment><segment>events</segment><segment>[8],</segment><segment>[19],</segment><segment>[20].</segment><segment>Despite</segment><segment>the</segment><segment>availability</segment><segment>of</segment><segment>these</segment><segment>standards,</segment><segment>there</segment><segment>remains</segment><segment>a</segment><segment>benchmark-design</segment><segment>problem.</segment><segment>Existing</segment><segment>vulnerability</segment><segment>benchmarks</segment><segment>such</segment><segment>as</segment><segment>OWASP</segment><segment>Benchmark,</segment><segment>NIST</segment><segment>SARD,</segment><segment>and</segment><segment>Juliet</segment><segment>provide</segment><segment>valuable</segment><segment>tool-evaluation</segment><segment>support,</segment><segment>but</segment><segment>their</segment><segment>structure</segment><segment>is</segment><segment>stronger</segment><segment>for</segment><segment>code-level</segment><segment>and</segment><segment>input-driven</segment><segment>weakness</segment><segment>classes</segment><segment>than</segment><segment>for</segment><segment>multi-step</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>failures</segment><segment>that</segment><segment>depend</segment><segment>on</segment><segment>role,</segment><segment>session,</segment><segment>object,</segment><segment>and</segment><segment>workflow</segment><segment>state</segment><segment>[7],</segment><segment>[9]-[11].</segment><segment>This</segment><segment>gap</segment><segment>matters</segment><segment>because</segment><segment>scanners,</segment><segment>AI-assisted</segment><segment>testing</segment><segment>systems,</segment><segment>manual</segment><segment>testers,</segment><segment>and</segment><segment>secure-development</segment><segment>teams</segment><segment>need</segment><segment>comparable</segment><segment>scenario</segment><segment>definitions</segment><segment>before</segment><segment>meaningful</segment><segment>evaluation</segment><segment>can</segment><segment>occur.</segment><segment>1.2</segment><segment>Problem</segment><segment>Statement</segment><segment>The</segment><segment>central</segment><segment>problem</segment><segment>addressed</segment><segment>in</segment><segment>this</segment><segment>article</segment><segment>is</segment><segment>that</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>vulnerabilities</segment><segment>are</segment><segment>difficult</segment><segment>to</segment><segment>benchmark</segment><segment>using</segment><segment>isolated</segment><segment>HTTP</segment><segment>requests,</segment><segment>generic</segment><segment>scanner</segment><segment>signatures,</segment><segment>or</segment><segment>code</segment><segment>snippets</segment><segment>detached</segment><segment>from</segment><segment>application</segment><segment>state.</segment><segment>A</segment><segment>conventional</segment><segment>vulnerability</segment><segment>test</segment><segment>case</segment><segment>often</segment><segment>asks</segment><segment>whether</segment><segment>a</segment><segment>specific</segment><segment>payload</segment><segment>triggers</segment><segment>a</segment><segment>specific</segment><segment>response.</segment><segment>In</segment><segment>contrast,</segment><segment>a</segment><segment>stateful</segment><segment>authorization</segment><segment>flaw</segment><segment>may</segment><segment>require</segment><segment>two</segment><segment>or</segment><segment>more</segment><segment>accounts,</segment><segment>at</segment><segment>least</segment><segment>one</segment><segment>protected</segment><segment>object,</segment><segment>a</segment><segment>known</segment><segment>workflow</segment><segment>state,</segment><segment>a</segment><segment>token</segment><segment>lifecycle</segment><segment>condition,</segment><segment>and</segment><segment>an</segment><segment>expected</segment><segment>policy</segment><segment>decision.</segment><segment>Without</segment><segment>documenting</segment><segment>these</segment><segment>conditions,</segment><segment>two</segment><segment>studies</segment><segment>may</segment><segment>appear</segment><segment>to</segment><segment>evaluate</segment><segment>the</segment><segment>same</segment><segment>vulnerability</segment><segment>category</segment><segment>while</segment><segment>actually</segment><segment>testing</segment><segment>different</segment><segment>security</segment><segment>properties.</segment><segment>This</segment><segment>creates</segment><segment>three</segment><segment>practical</segment><segment>weaknesses</segment><segment>in</segment><segment>the</segment><segment>research</segment><segment>landscape.</segment><segment>First,</segment><segment>scanner</segment><segment>evaluations</segment><segment>can</segment><segment>overrepresent</segment><segment>input-driven</segment><segment>flaws</segment><segment>while</segment><segment>underrepresenting</segment><segment>semantic</segment><segment>authorization</segment><segment>failures.</segment><segment>Second,</segment><segment>AI-assisted</segment><segment>testing</segment><segment>studies</segment><segment>may</segment><segment>claim</segment><segment>progress</segment><segment>without</segment><segment>showing</segment><segment>whether</segment><segment>role,</segment><segment>session,</segment><segment>object</segment><segment>ownership,</segment><segment>and</segment><segment>workflow</segment><segment>preconditions</segment><segment>were</segment><segment>modeled.</segment><segment>Third,</segment><segment>secure-</segment><segment>development</segment><segment>guidance</segment><segment>may</segment><segment>remain</segment><segment>difficult</segment><segment>to</segment><segment>operationalize</segment><segment>because</segment><segment>standards</segment><segment>requirements</segment><segment>are</segment><segment>not</segment><segment>translated</segment><segment>into</segment><segment>benchmark</segment><segment>scenario</segment><segment>templates.</segment><segment>The</segment><segment>problem</segment><segment>is</segment><segment>therefore</segment><segment>not</segment><segment>a</segment><segment>lack</segment><segment>of</segment><segment>standards</segment><segment>or</segment><segment>individual</segment><segment>testing</segment><segment>techniques;</segment><segment>the</segment><segment>problem</segment><segment>is</segment><segment>the</segment><segment>absence</segment><segment>of</segment><segment>a</segment><segment>structured</segment><segment>benchmark</segment><segment>design</segment><segment>that</segment><segment>connects</segment><segment>standards,</segment><segment>state</segment><segment>dimensions,</segment><segment>scenario</segment><segment>categories,</segment><segment>and</segment><segment>evaluation</segment><segment>criteria.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>4</segment><segment>1.3</segment><segment>Research</segment><segment>Gap</segment><segment>Prior</segment><segment>work</segment><segment>has</segment><segment>examined</segment><segment>web</segment><segment>application</segment><segment>security,</segment><segment>automated</segment><segment>vulnerability</segment><segment>detection,</segment><segment>access-</segment><segment>control</segment><segment>analysis,</segment><segment>business</segment><segment>logic</segment><segment>flaws,</segment><segment>scanner</segment><segment>performance,</segment><segment>and</segment><segment>software-vulnerability</segment><segment>benchmarks</segment><segment>[26]-[40].</segment><segment>However,</segment><segment>the</segment><segment>literature</segment><segment>remains</segment><segment>fragmented</segment><segment>when</segment><segment>the</segment><segment>target</segment><segment>weakness</segment><segment>depends</segment><segment>on</segment><segment>a</segment><segment>combination</segment><segment>of</segment><segment>authenticated</segment><segment>identity,</segment><segment>authorization</segment><segment>policy,</segment><segment>object</segment><segment>ownership,</segment><segment>token</segment><segment>lifecycle,</segment><segment>request</segment><segment>ordering,</segment><segment>and</segment><segment>business-state</segment><segment>transition.</segment><segment>A</segment><segment>stronger</segment><segment>benchmark</segment><segment>design</segment><segment>is</segment><segment>needed</segment><segment>to</segment><segment>make</segment><segment>such</segment><segment>weaknesses</segment><segment>reproducible</segment><segment>and</segment><segment>comparable</segment><segment>across</segment><segment>testing</segment><segment>approaches.</segment><segment>The</segment><segment>precise</segment><segment>research</segment><segment>gap</segment><segment>is</segment><segment>as</segment><segment>follows:</segment><segment>existing</segment><segment>web</segment><segment>security</segment><segment>research</segment><segment>lacks</segment><segment>a</segment><segment>standards-</segment><segment>aligned</segment><segment>benchmark</segment><segment>design</segment><segment>that</segment><segment>systematically</segment><segment>models</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>vulnerabilities</segment><segment>using</segment><segment>role,</segment><segment>session,</segment><segment>object-ownership,</segment><segment>and</segment><segment>workflow-</segment><segment>state</segment><segment>dimensions.</segment><segment>This</segment><segment>gap</segment><segment>prevents</segment><segment>consistent</segment><segment>comparison</segment><segment>of</segment><segment>manual</segment><segment>testing,</segment><segment>scanner-assisted</segment><segment>testing,</segment><segment>AI-assisted</segment><segment>testing,</segment><segment>and</segment><segment>standards-based</segment><segment>review</segment><segment>for</segment><segment>flaws</segment><segment>such</segment><segment>as</segment><segment>IDOR/BOLA,</segment><segment>privilege</segment><segment>escalation,</segment><segment>session</segment><segment>misuse,</segment><segment>role</segment><segment>confusion,</segment><segment>and</segment><segment>workflow</segment><segment>bypass.</segment><segment>1.4</segment><segment>Aim</segment><segment>and</segment><segment>Objectives</segment><segment>The</segment><segment>aim</segment><segment>of</segment><segment>this</segment><segment>article</segment><segment>is</segment><segment>to</segment><segment>design</segment><segment>a</segment><segment>standards-aligned</segment><segment>benchmark</segment><segment>model</segment><segment>for</segment><segment>classifying,</segment><segment>structuring,</segment><segment>and</segment><segment>evaluating</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>vulnerabilities</segment><segment>in</segment><segment>modern</segment><segment>web</segment><segment>applications.</segment><segment>The</segment><segment>objectives</segment><segment>are:</segment><segment>(1)</segment><segment>to</segment><segment>review</segment><segment>literature</segment><segment>on</segment><segment>broken</segment><segment>access</segment><segment>control,</segment><segment>authentication</segment><segment>workflow</segment><segment>flaws,</segment><segment>stateful</segment><segment>web</segment><segment>security</segment><segment>testing,</segment><segment>benchmark-based</segment><segment>evaluation,</segment><segment>scanner</segment><segment>limitations,</segment><segment>and</segment><segment>AI-</segment><segment>assisted</segment><segment>vulnerability</segment><segment>analysis;</segment><segment>(2)</segment><segment>to</segment><segment>identify</segment><segment>recurring</segment><segment>patterns</segment><segment>involving</segment><segment>role</segment><segment>misuse,</segment><segment>object</segment><segment>ownership,</segment><segment>session</segment><segment>state,</segment><segment>workflow</segment><segment>bypass,</segment><segment>token</segment><segment>lifecycle</segment><segment>errors,</segment><segment>and</segment><segment>privilege</segment><segment>transitions;</segment><segment>(3)</segment><segment>to</segment><segment>map</segment><segment>these</segment><segment>patterns</segment><segment>to</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025,</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10,</segment><segment>OWASP</segment><segment>ASVS,</segment><segment>OWASP</segment><segment>WSTG,</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>guidance,</segment><segment>and</segment><segment>MITRE</segment><segment>CWE;</segment><segment>(4)</segment><segment>to</segment><segment>develop</segment><segment>a</segment><segment>benchmark</segment><segment>scenario</segment><segment>taxonomy</segment><segment>for</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>weaknesses;</segment><segment>(5)</segment><segment>to</segment><segment>define</segment><segment>evaluation</segment><segment>criteria</segment><segment>for</segment><segment>manual</segment><segment>testing,</segment><segment>scanner-assisted</segment><segment>testing,</segment><segment>AI-assisted</segment><segment>testing,</segment><segment>and</segment><segment>standards-based</segment><segment>review;</segment><segment>and</segment><segment>(6)</segment><segment>to</segment><segment>propose</segment><segment>a</segment><segment>benchmark</segment><segment>documentation</segment><segment>template</segment><segment>and</segment><segment>future</segment><segment>validation</segment><segment>roadmap.</segment><segment>1.5</segment><segment>Research</segment><segment>Questions</segment><segment>RQ1.</segment><segment>What</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>vulnerabilities</segment><segment>are</segment><segment>most</segment><segment>frequently</segment><segment>discussed</segment><segment>in</segment><segment>recent</segment><segment>web</segment><segment>application</segment><segment>security</segment><segment>literature?</segment><segment>RQ2.</segment><segment>How</segment><segment>can</segment><segment>role,</segment><segment>session,</segment><segment>object</segment><segment>ownership,</segment><segment>and</segment><segment>workflow</segment><segment>state</segment><segment>be</segment><segment>used</segment><segment>to</segment><segment>classify</segment><segment>authentication</segment><segment>and</segment><segment>access-control</segment><segment>weaknesses?</segment><segment>RQ3.</segment><segment>How</segment><segment>can</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025,</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10,</segment><segment>OWASP</segment><segment>ASVS,</segment><segment>OWASP</segment><segment>WSTG,</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>guidance,</segment><segment>and</segment><segment>MITRE</segment><segment>CWE</segment><segment>be</segment><segment>mapped</segment><segment>to</segment><segment>benchmark</segment><segment>scenarios</segment><segment>for</segment><segment>stateful</segment><segment>web</segment><segment>security</segment><segment>testing?</segment><segment>RQ4.</segment><segment>What</segment><segment>benchmark</segment><segment>scenario</segment><segment>categories</segment><segment>are</segment><segment>needed</segment><segment>to</segment><segment>represent</segment><segment>IDOR/BOLA,</segment><segment>privilege</segment><segment>escalation,</segment><segment>session</segment><segment>misuse,</segment><segment>workflow</segment><segment>bypass,</segment><segment>role</segment><segment>confusion,</segment><segment>and</segment><segment>token</segment><segment>lifecycle</segment><segment>weaknesses?</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>5</segment><segment>RQ5.</segment><segment>What</segment><segment>evaluation</segment><segment>criteria</segment><segment>can</segment><segment>compare</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>AI-assisted,</segment><segment>and</segment><segment>standards-based</segment><segment>testing</segment><segment>approaches</segment><segment>without</segment><segment>reporting</segment><segment>unsupported</segment><segment>empirical</segment><segment>results?</segment><segment>RQ6.</segment><segment>What</segment><segment>limitations</segment><segment>exist</segment><segment>in</segment><segment>current</segment><segment>web</segment><segment>security</segment><segment>benchmarks</segment><segment>for</segment><segment>evaluating</segment><segment>access-control</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>flaws?</segment><segment>RQ7.</segment><segment>What</segment><segment>future</segment><segment>validation</segment><segment>pathway</segment><segment>is</segment><segment>required</segment><segment>to</segment><segment>make</segment><segment>AuthStateBench</segment><segment>suitable</segment><segment>for</segment><segment>empirical</segment><segment>cybersecurity</segment><segment>research?</segment><segment>1.6</segment><segment>Scope</segment><segment>The</segment><segment>scope</segment><segment>of</segment><segment>AuthStateBench</segment><segment>is</segment><segment>benchmark</segment><segment>design,</segment><segment>scenario</segment><segment>structuring,</segment><segment>standards</segment><segment>mapping,</segment><segment>evaluation</segment><segment>logic,</segment><segment>and</segment><segment>future</segment><segment>validation</segment><segment>planning.</segment><segment>The</segment><segment>article</segment><segment>focuses</segment><segment>on</segment><segment>web</segment><segment>applications</segment><segment>and</segment><segment>web</segment><segment>APIs</segment><segment>where</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>outcomes</segment><segment>depend</segment><segment>on</segment><segment>state.</segment><segment>The</segment><segment>benchmark</segment><segment>design</segment><segment>is</segment><segment>intentionally</segment><segment>abstract:</segment><segment>it</segment><segment>does</segment><segment>not</segment><segment>require</segment><segment>unauthorized</segment><segment>testing</segment><segment>of</segment><segment>real</segment><segment>systems,</segment><segment>private</segment><segment>datasets,</segment><segment>exploit</segment><segment>demonstrations,</segment><segment>scanner</segment><segment>output,</segment><segment>screenshots,</segment><segment>or</segment><segment>fabricated</segment><segment>tool</segment><segment>results.</segment><segment>It</segment><segment>is</segment><segment>suitable</segment><segment>for</segment><segment>later</segment><segment>implementation</segment><segment>in</segment><segment>controlled</segment><segment>vulnerable</segment><segment>applications,</segment><segment>teaching</segment><segment>laboratories,</segment><segment>controlled</segment><segment>research</segment><segment>environments,</segment><segment>or</segment><segment>expert-review</segment><segment>exercises.</segment><segment>The</segment><segment>scope</segment><segment>excludes</segment><segment>malware</segment><segment>analysis,</segment><segment>network</segment><segment>intrusion</segment><segment>detection,</segment><segment>blockchain</segment><segment>security,</segment><segment>IoT</segment><segment>firmware</segment><segment>testing,</segment><segment>and</segment><segment>generic</segment><segment>AI-in-cybersecurity</segment><segment>discussions</segment><segment>unless</segment><segment>they</segment><segment>directly</segment><segment>inform</segment><segment>benchmark-design</segment><segment>principles.</segment><segment>The</segment><segment>article</segment><segment>also</segment><segment>excludes</segment><segment>claims</segment><segment>of</segment><segment>detection</segment><segment>accuracy</segment><segment>because</segment><segment>no</segment><segment>tool</segment><segment>execution</segment><segment>or</segment><segment>empirical</segment><segment>implementation</segment><segment>is</segment><segment>reported.</segment><segment>1.7</segment><segment>Contributions</segment><segment>This</segment><segment>article</segment><segment>makes</segment><segment>five</segment><segment>concrete</segment><segment>contributions.</segment><segment>First,</segment><segment>it</segment><segment>proposes</segment><segment>AuthStateBench,</segment><segment>a</segment><segment>benchmark-design</segment><segment>artifact</segment><segment>for</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>weaknesses</segment><segment>in</segment><segment>web</segment><segment>applications</segment><segment>and</segment><segment>APIs.</segment><segment>Second,</segment><segment>it</segment><segment>defines</segment><segment>a</segment><segment>four-dimensional</segment><segment>state</segment><segment>model</segment><segment>that</segment><segment>captures</segment><segment>role</segment><segment>state,</segment><segment>session</segment><segment>state,</segment><segment>object-ownership</segment><segment>state,</segment><segment>and</segment><segment>workflow</segment><segment>state.</segment><segment>Third,</segment><segment>it</segment><segment>introduces</segment><segment>a</segment><segment>template</segment><segment>for</segment><segment>repeatable</segment><segment>benchmark</segment><segment>scenario</segment><segment>construction.</segment><segment>Fourth,</segment><segment>it</segment><segment>adds</segment><segment>a</segment><segment>standards-mapping</segment><segment>layer</segment><segment>that</segment><segment>connects</segment><segment>scenario</segment><segment>classes</segment><segment>to</segment><segment>OWASP,</segment><segment>ASVS,</segment><segment>WSTG,</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design,</segment><segment>MITRE</segment><segment>CWE,</segment><segment>OAuth,</segment><segment>and</segment><segment>OpenID</segment><segment>guidance.</segment><segment>Fifth,</segment><segment>it</segment><segment>defines</segment><segment>evidence-based</segment><segment>comparison</segment><segment>criteria</segment><segment>for</segment><segment>manual</segment><segment>testing,</segment><segment>scanner-assisted</segment><segment>testing,</segment><segment>AI-assisted</segment><segment>testing,</segment><segment>and</segment><segment>standards-based</segment><segment>review</segment><segment>without</segment><segment>inventing</segment><segment>unsupported</segment><segment>empirical</segment><segment>results.</segment><segment>taxonomy</segment><segment>and</segment><segment>editable</segment><segment>documentation</segment><segment>The</segment><segment>contribution</segment><segment>differs</segment><segment>from</segment><segment>a</segment><segment>generic</segment><segment>OWASP</segment><segment>survey</segment><segment>because</segment><segment>it</segment><segment>does</segment><segment>not</segment><segment>merely</segment><segment>summarize</segment><segment>risk</segment><segment>categories.</segment><segment>It</segment><segment>translates</segment><segment>recurring</segment><segment>access-control</segment><segment>and</segment><segment>authentication</segment><segment>failure</segment><segment>patterns</segment><segment>into</segment><segment>reusable</segment><segment>scenario</segment><segment>classes.</segment><segment>It</segment><segment>also</segment><segment>differs</segment><segment>from</segment><segment>a</segment><segment>scanner-evaluation</segment><segment>paper</segment><segment>because</segment><segment>it</segment><segment>does</segment><segment>not</segment><segment>claim</segment><segment>performance</segment><segment>measurements.</segment><segment>Instead,</segment><segment>it</segment><segment>prepares</segment><segment>a</segment><segment>benchmark</segment><segment>structure</segment><segment>that</segment><segment>can</segment><segment>later</segment><segment>support</segment><segment>such</segment><segment>measurements</segment><segment>transparently.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>6</segment><segment>1.8</segment><segment>Structure</segment><segment>of</segment><segment>the</segment><segment>Paper</segment><segment>Section</segment><segment>2</segment><segment>reviews</segment><segment>key</segment><segment>concepts,</segment><segment>recent</segment><segment>studies,</segment><segment>standards,</segment><segment>and</segment><segment>limitations</segment><segment>of</segment><segment>existing</segment><segment>work.</segment><segment>Section</segment><segment>3</segment><segment>presents</segment><segment>AuthStateBench</segment><segment>and</segment><segment>its</segment><segment>conceptual</segment><segment>components.</segment><segment>Section</segment><segment>4</segment><segment>explains</segment><segment>the</segment><segment>structured</segment><segment>literature-based</segment><segment>and</segment><segment>standards-mapping</segment><segment>methodology.</segment><segment>Section</segment><segment>5</segment><segment>presents</segment><segment>analytical</segment><segment>findings,</segment><segment>benchmark</segment><segment>outputs,</segment><segment>standards</segment><segment>alignment,</segment><segment>and</segment><segment>comparison</segment><segment>with</segment><segment>existing</segment><segment>approaches.</segment><segment>Section</segment><segment>6</segment><segment>discusses</segment><segment>implications,</segment><segment>limitations,</segment><segment>and</segment><segment>future</segment><segment>research.</segment><segment>Section</segment><segment>7</segment><segment>concludes</segment><segment>the</segment><segment>article.</segment><segment>Fig.</segment><segment>1</segment><segment>summarizes</segment><segment>the</segment><segment>article's</segment><segment>logic</segment><segment>in</segment><segment>a</segment><segment>roadmap</segment><segment>style:</segment><segment>evidence</segment><segment>is</segment><segment>gathered,</segment><segment>gaps</segment><segment>are</segment><segment>synthesized,</segment><segment>the</segment><segment>state</segment><segment>model</segment><segment>is</segment><segment>defined,</segment><segment>benchmark</segment><segment>artifacts</segment><segment>are</segment><segment>produced,</segment><segment>and</segment><segment>validation</segment><segment>is</segment><segment>reserved</segment><segment>for</segment><segment>controlled</segment><segment>future</segment><segment>work.</segment><segment>Fig.</segment><segment>1.</segment><segment>Research</segment><segment>roadmap</segment><segment>and</segment><segment>logical</segment><segment>framework</segment><segment>for</segment><segment>AuthStateBench.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>7</segment><segment>2.</segment><segment>Literature</segment><segment>Review</segment><segment>2.1</segment><segment>Key</segment><segment>Concepts</segment><segment>Authentication</segment><segment>verifies</segment><segment>the</segment><segment>identity</segment><segment>of</segment><segment>an</segment><segment>entity,</segment><segment>while</segment><segment>authorization</segment><segment>determines</segment><segment>whether</segment><segment>that</segment><segment>entity</segment><segment>may</segment><segment>access</segment><segment>a</segment><segment>resource</segment><segment>or</segment><segment>perform</segment><segment>a</segment><segment>function.</segment><segment>Session</segment><segment>management</segment><segment>maintains</segment><segment>continuity</segment><segment>between</segment><segment>authenticated</segment><segment>interactions,</segment><segment>often</segment><segment>through</segment><segment>cookies,</segment><segment>bearer</segment><segment>tokens,</segment><segment>refresh</segment><segment>tokens,</segment><segment>or</segment><segment>server-side</segment><segment>session</segment><segment>identifiers.</segment><segment>Object-level</segment><segment>authorization</segment><segment>checks</segment><segment>whether</segment><segment>a</segment><segment>user</segment><segment>may</segment><segment>access</segment><segment>a</segment><segment>specific</segment><segment>object</segment><segment>instance,</segment><segment>not</segment><segment>merely</segment><segment>whether</segment><segment>the</segment><segment>user</segment><segment>belongs</segment><segment>to</segment><segment>a</segment><segment>broad</segment><segment>role.</segment><segment>Workflow</segment><segment>authorization</segment><segment>checks</segment><segment>whether</segment><segment>an</segment><segment>action</segment><segment>is</segment><segment>permitted</segment><segment>at</segment><segment>a</segment><segment>particular</segment><segment>stage</segment><segment>of</segment><segment>a</segment><segment>business</segment><segment>process.</segment><segment>These</segment><segment>concepts</segment><segment>are</segment><segment>separated</segment><segment>analytically</segment><segment>but</segment><segment>often</segment><segment>fail</segment><segment>together</segment><segment>in</segment><segment>real</segment><segment>applications.</segment><segment>A</segment><segment>benchmark</segment><segment>for</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>weaknesses</segment><segment>must</segment><segment>therefore</segment><segment>model</segment><segment>more</segment><segment>than</segment><segment>a</segment><segment>vulnerability</segment><segment>label.</segment><segment>For</segment><segment>example,</segment><segment>IDOR/BOLA</segment><segment>is</segment><segment>not</segment><segment>simply</segment><segment>“changing</segment><segment>an</segment><segment>ID.”</segment><segment>It</segment><segment>is</segment><segment>a</segment><segment>failure</segment><segment>to</segment><segment>enforce</segment><segment>ownership</segment><segment>or</segment><segment>tenant</segment><segment>isolation</segment><segment>when</segment><segment>a</segment><segment>user-controlled</segment><segment>identifier</segment><segment>points</segment><segment>to</segment><segment>a</segment><segment>protected</segment><segment>object</segment><segment>[3],</segment><segment>[4],</segment><segment>[16]-[18].</segment><segment>Similarly,</segment><segment>session</segment><segment>misuse</segment><segment>may</segment><segment>include</segment><segment>insufficient</segment><segment>session</segment><segment>expiration,</segment><segment>reuse</segment><segment>of</segment><segment>tokens</segment><segment>after</segment><segment>logout,</segment><segment>fixation,</segment><segment>privilege</segment><segment>transition</segment><segment>failures,</segment><segment>or</segment><segment>incomplete</segment><segment>invalidation</segment><segment>after</segment><segment>account</segment><segment>changes</segment><segment>[15],</segment><segment>[21]-[23].</segment><segment>Workflow</segment><segment>bypass</segment><segment>refers</segment><segment>to</segment><segment>reaching</segment><segment>an</segment><segment>endpoint</segment><segment>or</segment><segment>state</segment><segment>transition</segment><segment>without</segment><segment>satisfying</segment><segment>preconditions</segment><segment>such</segment><segment>as</segment><segment>payment,</segment><segment>approval,</segment><segment>verification,</segment><segment>or</segment><segment>reauthentication.</segment><segment>2.2</segment><segment>Review</segment><segment>of</segment><segment>Recent</segment><segment>Studies</segment><segment>Research</segment><segment>on</segment><segment>access-control</segment><segment>vulnerability</segment><segment>detection</segment><segment>has</segment><segment>developed</segment><segment>through</segment><segment>static</segment><segment>analysis,</segment><segment>black-box</segment><segment>testing,</segment><segment>role-differential</segment><segment>analysis,</segment><segment>model</segment><segment>inference,</segment><segment>and</segment><segment>workflow-based</segment><segment>reasoning.</segment><segment>Sun</segment><segment>et</segment><segment>al.</segment><segment>proposed</segment><segment>static</segment><segment>detection</segment><segment>of</segment><segment>access-control</segment><segment>vulnerabilities</segment><segment>by</segment><segment>inferring</segment><segment>role-based</segment><segment>access</segment><segment>assumptions</segment><segment>from</segment><segment>code</segment><segment>[29].</segment><segment>Li</segment><segment>and</segment><segment>Xue</segment><segment>introduced</segment><segment>BLOCK,</segment><segment>a</segment><segment>black-box</segment><segment>approach</segment><segment>for</segment><segment>detecting</segment><segment>state</segment><segment>violation</segment><segment>attacks</segment><segment>by</segment><segment>observing</segment><segment>normal</segment><segment>behavior</segment><segment>and</segment><segment>identifying</segment><segment>invariant</segment><segment>violations</segment><segment>[30].</segment><segment>Felmetsger</segment><segment>et</segment><segment>al.</segment><segment>highlighted</segment><segment>that</segment><segment>logic</segment><segment>vulnerabilities</segment><segment>receive</segment><segment>less</segment><segment>attention</segment><segment>than</segment><segment>classic</segment><segment>input-validation</segment><segment>flaws,</segment><segment>even</segment><segment>though</segment><segment>they</segment><segment>can</segment><segment>cause</segment><segment>serious</segment><segment>security</segment><segment>failures</segment><segment>[31].</segment><segment>Pellegrino</segment><segment>and</segment><segment>Balzarotti</segment><segment>examined</segment><segment>black-box</segment><segment>detection</segment><segment>of</segment><segment>logic</segment><segment>flaws</segment><segment>using</segment><segment>behavioral</segment><segment>patterns</segment><segment>extracted</segment><segment>from</segment><segment>interactions</segment><segment>[32].</segment><segment>More</segment><segment>recent</segment><segment>work</segment><segment>continues</segment><segment>to</segment><segment>show</segment><segment>that</segment><segment>authorization</segment><segment>flaws</segment><segment>are</segment><segment>difficult</segment><segment>to</segment><segment>evaluate</segment><segment>without</segment><segment>stateful</segment><segment>context.</segment><segment>Rennhard</segment><segment>et</segment><segment>al.</segment><segment>presented</segment><segment>an</segment><segment>approach</segment><segment>to</segment><segment>automatically</segment><segment>detect</segment><segment>HTTP</segment><segment>GET</segment><segment>request-based</segment><segment>access-control</segment><segment>vulnerabilities</segment><segment>[26].</segment><segment>Zhong</segment><segment>et</segment><segment>al.</segment><segment>surveyed</segment><segment>prevention</segment><segment>and</segment><segment>detection</segment><segment>of</segment><segment>access-control</segment><segment>vulnerabilities</segment><segment>in</segment><segment>web</segment><segment>applications</segment><segment>and</segment><segment>emphasized</segment><segment>roles,</segment><segment>permissions,</segment><segment>resources,</segment><segment>and</segment><segment>business</segment><segment>logic</segment><segment>[27].</segment><segment>BACScan</segment><segment>addressed</segment><segment>black-box</segment><segment>detection</segment><segment>of</segment><segment>broken</segment><segment>access-control</segment><segment>vulnerabilities</segment><segment>and</segment><segment>reinforced</segment><segment>the</segment><segment>need</segment><segment>to</segment><segment>consider</segment><segment>multiple</segment><segment>users</segment><segment>and</segment><segment>permissions</segment><segment>[28].</segment><segment>SWaTEval</segment><segment>proposed</segment><segment>an</segment><segment>evaluation</segment><segment>framework</segment><segment>for</segment><segment>stateful</segment><segment>web</segment><segment>application</segment><segment>testing,</segment><segment>and</segment><segment>ProFuzzBench</segment><segment>showed</segment><segment>the</segment><segment>value</segment><segment>of</segment><segment>explicit</segment><segment>benchmarks</segment><segment>for</segment><segment>stateful</segment><segment>protocol</segment><segment>fuzzing</segment><segment>even</segment><segment>outside</segment><segment>web</segment><segment>authorization</segment><segment>[35],</segment><segment>[36].</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>8</segment><segment>Benchmarking</segment><segment>literature</segment><segment>also</segment><segment>motivates</segment><segment>AuthStateBench.</segment><segment>OWASP</segment><segment>Benchmark</segment><segment>and</segment><segment>NIST</segment><segment>SARD</segment><segment>support</segment><segment>evaluation</segment><segment>of</segment><segment>vulnerability</segment><segment>detection</segment><segment>tools,</segment><segment>while</segment><segment>Juliet</segment><segment>and</segment><segment>newer</segment><segment>SARD</segment><segment>resources</segment><segment>provide</segment><segment>curated</segment><segment>software-assurance</segment><segment>test</segment><segment>cases</segment><segment>[7],</segment><segment>[9]-[11].</segment><segment>However,</segment><segment>benchmark</segment><segment>critiques</segment><segment>have</segment><segment>noted</segment><segment>that</segment><segment>benchmark</segment><segment>structure</segment><segment>can</segment><segment>shape</segment><segment>tool</segment><segment>behavior</segment><segment>and</segment><segment>may</segment><segment>not</segment><segment>always</segment><segment>represent</segment><segment>real</segment><segment>semantic</segment><segment>vulnerabilities</segment><segment>[38]-[40].</segment><segment>AI-assisted</segment><segment>vulnerability</segment><segment>detection</segment><segment>further</segment><segment>increases</segment><segment>the</segment><segment>need</segment><segment>for</segment><segment>clearly</segment><segment>defined</segment><segment>evaluation</segment><segment>tasks</segment><segment>because</segment><segment>LLM-based</segment><segment>systems</segment><segment>may</segment><segment>appear</segment><segment>effective</segment><segment>on</segment><segment>code-level</segment><segment>benchmarks</segment><segment>while</segment><segment>struggling</segment><segment>with</segment><segment>multi-step</segment><segment>security</segment><segment>specifications,</segment><segment>contextual</segment><segment>authorization</segment><segment>rules,</segment><segment>and</segment><segment>workflow</segment><segment>semantics</segment><segment>[41]-[46].</segment><segment>2.3</segment><segment>Existing</segment><segment>Standards,</segment><segment>Frameworks,</segment><segment>and</segment><segment>Models</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025</segment><segment>and</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10:2023</segment><segment>provide</segment><segment>risk</segment><segment>taxonomies</segment><segment>that</segment><segment>place</segment><segment>broken</segment><segment>access</segment><segment>control,</segment><segment>object-level</segment><segment>authorization,</segment><segment>broken</segment><segment>authentication,</segment><segment>and</segment><segment>function-</segment><segment>level</segment><segment>authorization</segment><segment>among</segment><segment>major</segment><segment>application-security</segment><segment>concerns</segment><segment>[1]-[4].</segment><segment>OWASP</segment><segment>ASVS</segment><segment>5.0.0</segment><segment>provides</segment><segment>a</segment><segment>verification</segment><segment>standard</segment><segment>for</segment><segment>web</segment><segment>application</segment><segment>technical</segment><segment>controls</segment><segment>and</segment><segment>is</segment><segment>particularly</segment><segment>relevant</segment><segment>because</segment><segment>it</segment><segment>includes</segment><segment>requirements</segment><segment>for</segment><segment>authentication,</segment><segment>session</segment><segment>management,</segment><segment>access</segment><segment>control,</segment><segment>API</segment><segment>behavior,</segment><segment>error</segment><segment>handling,</segment><segment>logging,</segment><segment>and</segment><segment>business</segment><segment>logic</segment><segment>[5].</segment><segment>OWASP</segment><segment>WSTG</segment><segment>complements</segment><segment>ASVS</segment><segment>by</segment><segment>describing</segment><segment>testing</segment><segment>activities</segment><segment>and</segment><segment>reporting</segment><segment>expectations</segment><segment>[6].</segment><segment>NIST</segment><segment>SSDF</segment><segment>describes</segment><segment>secure</segment><segment>software</segment><segment>development</segment><segment>practices</segment><segment>for</segment><segment>mitigating</segment><segment>software</segment><segment>vulnerability</segment><segment>risk,</segment><segment>while</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>guidance</segment><segment>frames</segment><segment>secure</segment><segment>defaults,</segment><segment>product</segment><segment>accountability,</segment><segment>and</segment><segment>reduction</segment><segment>of</segment><segment>customer</segment><segment>security</segment><segment>burden</segment><segment>as</segment><segment>core</segment><segment>software</segment><segment>manufacturer</segment><segment>responsibilities</segment><segment>[8],</segment><segment>[19],</segment><segment>[20].</segment><segment>MITRE</segment><segment>CWE</segment><segment>provides</segment><segment>weakness</segment><segment>families</segment><segment>that</segment><segment>can</segment><segment>map</segment><segment>benchmark</segment><segment>scenarios</segment><segment>to</segment><segment>well-known</segment><segment>categories</segment><segment>such</segment><segment>as</segment><segment>improper</segment><segment>access</segment><segment>control,</segment><segment>improper</segment><segment>authentication,</segment><segment>missing</segment><segment>authentication</segment><segment>for</segment><segment>critical</segment><segment>function,</segment><segment>insufficient</segment><segment>session</segment><segment>expiration,</segment><segment>authorization</segment><segment>bypass</segment><segment>through</segment><segment>user-controlled</segment><segment>key,</segment><segment>missing</segment><segment>authorization,</segment><segment>and</segment><segment>incorrect</segment><segment>authorization</segment><segment>[12]-[18].</segment><segment>OAuth</segment><segment>2.0</segment><segment>security</segment><segment>best</segment><segment>current</segment><segment>practice</segment><segment>and</segment><segment>OpenID</segment><segment>Connect</segment><segment>specifications</segment><segment>help</segment><segment>ground</segment><segment>authentication</segment><segment>and</segment><segment>token</segment><segment>lifecycle</segment><segment>scenarios</segment><segment>in</segment><segment>real</segment><segment>identity</segment><segment>protocols</segment><segment>[21]-[23].</segment><segment>2.4</segment><segment>Limitations</segment><segment>of</segment><segment>Existing</segment><segment>Work</segment><segment>Existing</segment><segment>work</segment><segment>has</segment><segment>four</segment><segment>main</segment><segment>limitations</segment><segment>for</segment><segment>this</segment><segment>article's</segment><segment>purpose.</segment><segment>First,</segment><segment>many</segment><segment>benchmarks</segment><segment>emphasize</segment><segment>source-code-level</segment><segment>flaws</segment><segment>or</segment><segment>input-driven</segment><segment>vulnerabilities,</segment><segment>which</segment><segment>are</segment><segment>important</segment><segment>but</segment><segment>do</segment><segment>not</segment><segment>fully</segment><segment>capture</segment><segment>stateful</segment><segment>authorization</segment><segment>semantics.</segment><segment>Second,</segment><segment>scanner-comparison</segment><segment>studies</segment><segment>often</segment><segment>evaluate</segment><segment>whether</segment><segment>tools</segment><segment>detect</segment><segment>known</segment><segment>classes</segment><segment>without</segment><segment>documenting</segment><segment>the</segment><segment>role,</segment><segment>session,</segment><segment>object,</segment><segment>and</segment><segment>workflow</segment><segment>state</segment><segment>required</segment><segment>to</segment><segment>reproduce</segment><segment>authorization</segment><segment>failures.</segment><segment>Third,</segment><segment>access-control</segment><segment>studies</segment><segment>vary</segment><segment>in</segment><segment>their</segment><segment>threat</segment><segment>models</segment><segment>and</segment><segment>assumptions,</segment><segment>making</segment><segment>comparison</segment><segment>difficult</segment><segment>across</segment><segment>manual,</segment><segment>automated,</segment><segment>and</segment><segment>AI-assisted</segment><segment>approaches.</segment><segment>Fourth,</segment><segment>standards</segment><segment>provide</segment><segment>requirements</segment><segment>and</segment><segment>guidance</segment><segment>but</segment><segment>do</segment><segment>not</segment><segment>always</segment><segment>translate</segment><segment>them</segment><segment>into</segment><segment>benchmark-ready</segment><segment>scenario</segment><segment>templates.</segment><segment>These</segment><segment>limitations</segment><segment>do</segment><segment>not</segment><segment>reduce</segment><segment>the</segment><segment>value</segment><segment>of</segment><segment>existing</segment><segment>standards</segment><segment>or</segment><segment>benchmarks.</segment><segment>Rather,</segment><segment>they</segment><segment>identify</segment><segment>a</segment><segment>missing</segment><segment>layer</segment><segment>between</segment><segment>standards</segment><segment>and</segment><segment>tool</segment><segment>evaluation:</segment><segment>a</segment><segment>scenario-design</segment><segment>model</segment><segment>that</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>9</segment><segment>specifies</segment><segment>preconditions,</segment><segment>actors,</segment><segment>state,</segment><segment>expected</segment><segment>secure</segment><segment>behavior,</segment><segment>insecure</segment><segment>behavior,</segment><segment>evidence</segment><segment>requirements,</segment><segment>and</segment><segment>mapping</segment><segment>to</segment><segment>standards.</segment><segment>AuthStateBench</segment><segment>is</segment><segment>intended</segment><segment>to</segment><segment>provide</segment><segment>that</segment><segment>layer.</segment><segment>2.5</segment><segment>Summary</segment><segment>of</segment><segment>Research</segment><segment>Gap</segment><segment>The</segment><segment>literature</segment><segment>shows</segment><segment>strong</segment><segment>interest</segment><segment>in</segment><segment>web</segment><segment>application</segment><segment>security,</segment><segment>access-control</segment><segment>analysis,</segment><segment>scanner</segment><segment>evaluation,</segment><segment>software-assurance</segment><segment>datasets,</segment><segment>and</segment><segment>AI-assisted</segment><segment>vulnerability</segment><segment>detection.</segment><segment>It</segment><segment>also</segment><segment>shows</segment><segment>a</segment><segment>persistent</segment><segment>gap:</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>failures</segment><segment>require</segment><segment>benchmark</segment><segment>scenarios</segment><segment>that</segment><segment>encode</segment><segment>role,</segment><segment>session,</segment><segment>object</segment><segment>ownership,</segment><segment>and</segment><segment>workflow</segment><segment>conditions.</segment><segment>Without</segment><segment>such</segment><segment>encoding,</segment><segment>researchers</segment><segment>and</segment><segment>practitioners</segment><segment>risk</segment><segment>comparing</segment><segment>tools</segment><segment>and</segment><segment>methods</segment><segment>on</segment><segment>unclear</segment><segment>or</segment><segment>incomplete</segment><segment>assumptions.</segment><segment>AuthStateBench</segment><segment>responds</segment><segment>to</segment><segment>this</segment><segment>gap</segment><segment>by</segment><segment>proposing</segment><segment>a</segment><segment>structured</segment><segment>benchmark</segment><segment>design</segment><segment>rather</segment><segment>than</segment><segment>claiming</segment><segment>empirical</segment><segment>results.</segment><segment>Table</segment><segment>1.</segment><segment>Literature</segment><segment>search</segment><segment>strategy</segment><segment>and</segment><segment>source</segment><segment>categories.</segment><segment>Source</segment><segment>category</segment><segment>Academic</segment><segment>literature</segment><segment>Security</segment><segment>standards</segment><segment>and</segment><segment>guidance</segment><segment>Weakness</segment><segment>taxonomies</segment><segment>Benchmark</segment><segment>resources</segment><segment>Identity</segment><segment>and</segment><segment>risk</segment><segment>specifications</segment><segment>Examples</segment><segment>IEEE</segment><segment>Xplore,</segment><segment>ACM</segment><segment>Digital</segment><segment>Library,</segment><segment>SpringerLink,</segment><segment>ScienceDirect,</segment><segment>Wiley,</segment><segment>Taylor</segment><segment>&amp;</segment><segment>Francis,</segment><segment>Google</segment><segment>Scholar</segment><segment>discovery</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025,</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10,</segment><segment>OWASP</segment><segment>ASVS</segment><segment>5.0.0,</segment><segment>OWASP</segment><segment>WSTG,</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>MITRE</segment><segment>CWE</segment><segment>families</segment><segment>for</segment><segment>access</segment><segment>control,</segment><segment>authentication,</segment><segment>authorization,</segment><segment>session</segment><segment>expiration,</segment><segment>and</segment><segment>user-</segment><segment>controlled</segment><segment>keys</segment><segment>OWASP</segment><segment>Benchmark,</segment><segment>NIST</segment><segment>SARD,</segment><segment>Juliet,</segment><segment>SARD</segment><segment>documentation,</segment><segment>ProFuzzBench,</segment><segment>SWaTEval</segment><segment>OAuth</segment><segment>2.0</segment><segment>Security</segment><segment>BCP,</segment><segment>OpenID</segment><segment>Connect,</segment><segment>CVSS,</segment><segment>EPSS</segment><segment>Purpose</segment><segment>in</segment><segment>the</segment><segment>review</segment><segment>Identify</segment><segment>peer-reviewed</segment><segment>studies</segment><segment>on</segment><segment>access-control</segment><segment>testing,</segment><segment>stateful</segment><segment>web</segment><segment>testing,</segment><segment>logic</segment><segment>flaws,</segment><segment>benchmarks,</segment><segment>scanners,</segment><segment>and</segment><segment>AI-assisted</segment><segment>vulnerability</segment><segment>analysis.</segment><segment>Ground</segment><segment>scenario</segment><segment>categories</segment><segment>in</segment><segment>recognized</segment><segment>application-</segment><segment>security</segment><segment>and</segment><segment>secure-</segment><segment>development</segment><segment>expectations.</segment><segment>Map</segment><segment>benchmark</segment><segment>scenarios</segment><segment>to</segment><segment>common</segment><segment>weakness</segment><segment>identifiers</segment><segment>and</segment><segment>improve</segment><segment>traceability.</segment><segment>Compare</segment><segment>existing</segment><segment>benchmark</segment><segment>assumptions</segment><segment>with</segment><segment>the</segment><segment>proposed</segment><segment>stateful</segment><segment>scenario</segment><segment>design.</segment><segment>Support</segment><segment>authentication,</segment><segment>token</segment><segment>lifecycle,</segment><segment>session,</segment><segment>and</segment><segment>risk-</segment><segment>evidence</segment><segment>interpretation.</segment><segment>Table</segment><segment>2.</segment><segment>Inclusion</segment><segment>and</segment><segment>exclusion</segment><segment>criteria.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Criterion</segment><segment>type</segment><segment>Topic</segment><segment>relevance</segment><segment>Method</segment><segment>relevance</segment><segment>Source</segment><segment>quality</segment><segment>Time</segment><segment>period</segment><segment>Integrity</segment><segment>boundary</segment><segment>Included</segment><segment>Web</segment><segment>application</segment><segment>security,</segment><segment>API</segment><segment>security,</segment><segment>authentication,</segment><segment>authorization,</segment><segment>session</segment><segment>management,</segment><segment>workflow</segment><segment>abuse,</segment><segment>benchmark</segment><segment>design,</segment><segment>scanner</segment><segment>evaluation,</segment><segment>AI-</segment><segment>assisted</segment><segment>testing</segment><segment>Studies</segment><segment>proposing,</segment><segment>evaluating,</segment><segment>surveying,</segment><segment>or</segment><segment>systematizing</segment><segment>testing</segment><segment>methods,</segment><segment>standards,</segment><segment>benchmarks,</segment><segment>scanners,</segment><segment>taxonomies,</segment><segment>or</segment><segment>frameworks</segment><segment>Peer-reviewed</segment><segment>papers,</segment><segment>official</segment><segment>standards,</segment><segment>recognized</segment><segment>cybersecurity</segment><segment>guidance,</segment><segment>and</segment><segment>well-established</segment><segment>benchmark</segment><segment>resources</segment><segment>Primarily</segment><segment>2020-2026,</segment><segment>with</segment><segment>older</segment><segment>foundational</segment><segment>work</segment><segment>retained</segment><segment>where</segment><segment>it</segment><segment>shaped</segment><segment>access-control</segment><segment>or</segment><segment>benchmark</segment><segment>research</segment><segment>Sources</segment><segment>compatible</segment><segment>with</segment><segment>a</segment><segment>literature-based</segment><segment>design</segment><segment>article</segment><segment>without</segment><segment>fabricated</segment><segment>results</segment><segment>Page</segment><segment>10</segment><segment>Excluded</segment><segment>Generic</segment><segment>cybersecurity</segment><segment>with</segment><segment>no</segment><segment>web</segment><segment>application</segment><segment>relevance;</segment><segment>malware-only,</segment><segment>blockchain-only,</segment><segment>IoT-only,</segment><segment>or</segment><segment>network-only</segment><segment>studies.</segment><segment>Papers</segment><segment>that</segment><segment>mention</segment><segment>tools</segment><segment>without</segment><segment>explaining</segment><segment>vulnerability</segment><segment>modeling</segment><segment>or</segment><segment>test</segment><segment>design.</segment><segment>Unverifiable</segment><segment>blogs,</segment><segment>marketing</segment><segment>pages,</segment><segment>unsupported</segment><segment>claims,</segment><segment>and</segment><segment>sources</segment><segment>without</segment><segment>sufficient</segment><segment>technical</segment><segment>relevance.</segment><segment>Older</segment><segment>material</segment><segment>without</segment><segment>continuing</segment><segment>relevance</segment><segment>or</segment><segment>citation</segment><segment>value.</segment><segment>Studies</segment><segment>requiring</segment><segment>private</segment><segment>datasets,</segment><segment>unauthorized</segment><segment>testing,</segment><segment>or</segment><segment>non-reproducible</segment><segment>company-only</segment><segment>evidence.</segment><segment>Table</segment><segment>3.</segment><segment>Literature</segment><segment>comparison</segment><segment>on</segment><segment>stateful</segment><segment>web</segment><segment>security</segment><segment>testing.</segment><segment>Research</segment><segment>stream</segment><segment>Representative</segment><segment>sources</segment><segment>Strength</segment><segment>Static</segment><segment>access-control</segment><segment>analysis</segment><segment>Sun</segment><segment>et</segment><segment>al.</segment><segment>[29]</segment><segment>Can</segment><segment>infer</segment><segment>access-</segment><segment>control</segment><segment>assumptions</segment><segment>from</segment><segment>source</segment><segment>code</segment><segment>and</segment><segment>detect</segment><segment>role-related</segment><segment>weaknesses.</segment><segment>Black-box</segment><segment>state</segment><segment>or</segment><segment>BLOCK</segment><segment>[30],</segment><segment>Models</segment><segment>behavior</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Limitation</segment><segment>addressed</segment><segment>by</segment><segment>AuthStateBench</segment><segment>Not</segment><segment>suitable</segment><segment>when</segment><segment>source</segment><segment>code</segment><segment>is</segment><segment>unavailable;</segment><segment>benchmark</segment><segment>scenarios</segment><segment>still</segment><segment>need</segment><segment>stateful</segment><segment>documentation.</segment><segment>Different</segment><segment>studies</segment><segment>use</segment><segment>G.</segment><segment>2076</segment><segment>logic</segment><segment>testing</segment><segment>Pellegrino</segment><segment>and</segment><segment>Balzarotti</segment><segment>[32],</segment><segment>Li</segment><segment>et</segment><segment>al.</segment><segment>[34]</segment><segment>from</segment><segment>interactions</segment><segment>and</segment><segment>can</segment><segment>address</segment><segment>logic</segment><segment>or</segment><segment>state</segment><segment>violations.</segment><segment>Parameter</segment><segment>tampering</segment><segment>and</segment><segment>IDOR/BOLA</segment><segment>analysis</segment><segment>NoTamper</segment><segment>[33],</segment><segment>Rennhard</segment><segment>et</segment><segment>al.</segment><segment>[26],</segment><segment>BACScan</segment><segment>[28]</segment><segment>General</segment><segment>vulnerability</segment><segment>benchmarks</segment><segment>OWASP</segment><segment>Benchmark</segment><segment>[7],</segment><segment>SARD</segment><segment>and</segment><segment>Juliet</segment><segment>[9]-[11]</segment><segment>AI-assisted</segment><segment>vulnerability</segment><segment>detection</segment><segment>Xu</segment><segment>et</segment><segment>al.</segment><segment>[41],</segment><segment>Far</segment><segment>et</segment><segment>al.</segment><segment>[42],</segment><segment>CVE-Bench</segment><segment>[44],</segment><segment>Cybench</segment><segment>[45]</segment><segment>Targets</segment><segment>object</segment><segment>identifiers,</segment><segment>request</segment><segment>parameters,</segment><segment>and</segment><segment>access-control</segment><segment>violations.</segment><segment>Useful</segment><segment>for</segment><segment>repeatable</segment><segment>tool</segment><segment>evaluation</segment><segment>and</segment><segment>known</segment><segment>test</segment><segment>cases.</segment><segment>Highlights</segment><segment>growing</segment><segment>role</segment><segment>of</segment><segment>AI</segment><segment>in</segment><segment>security</segment><segment>testing</segment><segment>and</segment><segment>exploitation</segment><segment>reasoning.</segment><segment>Page</segment><segment>11</segment><segment>different</segment><segment>assumptions;</segment><segment>AuthStateBench</segment><segment>standardizes</segment><segment>role-</segment><segment>session-object-</segment><segment>workflow</segment><segment>dimensions.</segment><segment>Object</segment><segment>ownership</segment><segment>and</segment><segment>victim/attacker</segment><segment>role</segment><segment>conditions</segment><segment>need</segment><segment>explicit</segment><segment>benchmark</segment><segment>representation.</segment><segment>Primarily</segment><segment>stronger</segment><segment>for</segment><segment>code-level</segment><segment>or</segment><segment>input-</segment><segment>driven</segment><segment>weaknesses</segment><segment>than</segment><segment>multi-user</segment><segment>workflow</segment><segment>semantics.</segment><segment>Requires</segment><segment>clearer</segment><segment>task</segment><segment>specifications</segment><segment>to</segment><segment>evaluate</segment><segment>semantic</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>behavior.</segment><segment>3.</segment><segment>Proposed</segment><segment>Framework</segment><segment>/</segment><segment>Benchmark</segment><segment>/</segment><segment>Model</segment><segment>3.1</segment><segment>Conceptual</segment><segment>Basis</segment><segment>AuthStateBench</segment><segment>is</segment><segment>built</segment><segment>on</segment><segment>the</segment><segment>premise</segment><segment>that</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>vulnerabilities</segment><segment>are</segment><segment>not</segment><segment>adequately</segment><segment>represented</segment><segment>by</segment><segment>a</segment><segment>single</segment><segment>request</segment><segment>or</segment><segment>payload.</segment><segment>They</segment><segment>must</segment><segment>be</segment><segment>represented</segment><segment>as</segment><segment>stateful</segment><segment>security-policy</segment><segment>failures.</segment><segment>The</segment><segment>benchmark</segment><segment>therefore</segment><segment>uses</segment><segment>four</segment><segment>state</segment><segment>dimensions:</segment><segment>role</segment><segment>state,</segment><segment>session</segment><segment>state,</segment><segment>object-ownership</segment><segment>state,</segment><segment>and</segment><segment>workflow</segment><segment>state.</segment><segment>Role</segment><segment>state</segment><segment>describes</segment><segment>the</segment><segment>identity</segment><segment>and</segment><segment>privilege</segment><segment>level</segment><segment>of</segment><segment>the</segment><segment>actor.</segment><segment>Session</segment><segment>state</segment><segment>describes</segment><segment>token</segment><segment>validity,</segment><segment>freshness,</segment><segment>login/logout</segment><segment>condition,</segment><segment>reauthentication</segment><segment>status,</segment><segment>and</segment><segment>privilege-transition</segment><segment>effects.</segment><segment>Object-</segment><segment>ownership</segment><segment>state</segment><segment>describes</segment><segment>whether</segment><segment>the</segment><segment>target</segment><segment>resource</segment><segment>is</segment><segment>owned</segment><segment>by,</segment><segment>shared</segment><segment>with,</segment><segment>hidden</segment><segment>from,</segment><segment>or</segment><segment>unrelated</segment><segment>to</segment><segment>the</segment><segment>actor.</segment><segment>Workflow</segment><segment>state</segment><segment>describes</segment><segment>whether</segment><segment>the</segment><segment>requested</segment><segment>action</segment><segment>occurs</segment><segment>in</segment><segment>the</segment><segment>expected</segment><segment>business</segment><segment>sequence.</segment><segment>The</segment><segment>benchmark</segment><segment>design</segment><segment>treats</segment><segment>a</segment><segment>vulnerability</segment><segment>scenario</segment><segment>as</segment><segment>a</segment><segment>controlled</segment><segment>policy</segment><segment>test.</segment><segment>Each</segment><segment>scenario</segment><segment>begins</segment><segment>with</segment><segment>a</segment><segment>documented</segment><segment>precondition,</segment><segment>an</segment><segment>attacker</segment><segment>role,</segment><segment>an</segment><segment>optional</segment><segment>victim</segment><segment>or</segment><segment>target</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>12</segment><segment>role,</segment><segment>a</segment><segment>protected</segment><segment>object,</segment><segment>a</segment><segment>session</segment><segment>condition,</segment><segment>a</segment><segment>workflow</segment><segment>condition,</segment><segment>an</segment><segment>action,</segment><segment>expected</segment><segment>secure</segment><segment>behavior,</segment><segment>observed</segment><segment>insecure</segment><segment>behavior</segment><segment>in</segment><segment>a</segment><segment>vulnerable</segment><segment>implementation,</segment><segment>and</segment><segment>a</segment><segment>standards/CWE</segment><segment>mapping.</segment><segment>This</segment><segment>approach</segment><segment>allows</segment><segment>future</segment><segment>implementation</segment><segment>without</segment><segment>relying</segment><segment>on</segment><segment>private</segment><segment>systems</segment><segment>or</segment><segment>unauthorized</segment><segment>exploitation.</segment><segment>To</segment><segment>make</segment><segment>the</segment><segment>design</segment><segment>explicit,</segment><segment>each</segment><segment>benchmark</segment><segment>scenario</segment><segment>is</segment><segment>represented</segment><segment>as</segment><segment>a</segment><segment>stateful</segment><segment>policy-test</segment><segment>tuple</segment><segment>rather</segment><segment>than</segment><segment>a</segment><segment>single</segment><segment>vulnerable</segment><segment>request:</segment><segment>B_s</segment><segment>=</segment><segment>&lt;R_s,</segment><segment>S_s,</segment><segment>O_s,</segment><segment>W_s,</segment><segment>A_s,</segment><segment>P_s,</segment><segment>E_s&gt;</segment><segment>(1)</segment><segment>where</segment><segment>R_s</segment><segment>is</segment><segment>role</segment><segment>state,</segment><segment>S_s</segment><segment>is</segment><segment>session</segment><segment>state,</segment><segment>O_s</segment><segment>is</segment><segment>object-ownership</segment><segment>state,</segment><segment>W_s</segment><segment>is</segment><segment>workflow</segment><segment>state,</segment><segment>A_s</segment><segment>is</segment><segment>the</segment><segment>attempted</segment><segment>action,</segment><segment>P_s</segment><segment>is</segment><segment>the</segment><segment>expected</segment><segment>policy</segment><segment>decision,</segment><segment>and</segment><segment>E_s</segment><segment>is</segment><segment>the</segment><segment>required</segment><segment>evidence</segment><segment>record.</segment><segment>Scenario</segment><segment>coverage</segment><segment>can</segment><segment>later</segment><segment>be</segment><segment>computed</segment><segment>as:</segment><segment>Coverage</segment><segment>=</segment><segment>|C_tested</segment><segment>∩</segment><segment>C_required|</segment><segment>/</segment><segment>|C_required|</segment><segment>(2)</segment><segment>A</segment><segment>future</segment><segment>method-comparison</segment><segment>study</segment><segment>may</segment><segment>score</segment><segment>evidence</segment><segment>quality</segment><segment>using</segment><segment>a</segment><segment>weighted</segment><segment>criterion</segment><segment>model:</segment><segment>Score_m</segment><segment>=</segment><segment>Σ(k=1..n)</segment><segment>w_k</segment><segment>x_m,k</segment><segment>(3)</segment><segment>where</segment><segment>x_m,k</segment><segment>denotes</segment><segment>whether</segment><segment>method</segment><segment>m</segment><segment>satisfies</segment><segment>criterion</segment><segment>k,</segment><segment>and</segment><segment>w_k</segment><segment>allows</segment><segment>future</segment><segment>researchers</segment><segment>to</segment><segment>prioritize</segment><segment>scenario</segment><segment>recognition,</segment><segment>precondition</segment><segment>handling,</segment><segment>evidence</segment><segment>quality,</segment><segment>false-</segment><segment>positive</segment><segment>control,</segment><segment>and</segment><segment>reproducibility.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>13</segment><segment>Fig.</segment><segment>2.</segment><segment>Four-dimensional</segment><segment>state</segment><segment>model</segment><segment>used</segment><segment>to</segment><segment>construct</segment><segment>AuthStateBench</segment><segment>scenarios.</segment><segment>3.2</segment><segment>Main</segment><segment>Components</segment><segment>AuthStateBench</segment><segment>contains</segment><segment>five</segment><segment>components.</segment><segment>The</segment><segment>first</segment><segment>component</segment><segment>is</segment><segment>the</segment><segment>scenario</segment><segment>taxonomy,</segment><segment>which</segment><segment>groups</segment><segment>benchmark</segment><segment>cases</segment><segment>into</segment><segment>recurring</segment><segment>classes</segment><segment>such</segment><segment>as</segment><segment>object-level</segment><segment>authorization</segment><segment>failure,</segment><segment>function-level</segment><segment>authorization</segment><segment>failure,</segment><segment>privilege</segment><segment>escalation,</segment><segment>session</segment><segment>lifecycle</segment><segment>failure,</segment><segment>workflow</segment><segment>bypass,</segment><segment>role-confusion</segment><segment>failure,</segment><segment>tenant-isolation</segment><segment>failure,</segment><segment>and</segment><segment>reauthentication</segment><segment>failure.</segment><segment>The</segment><segment>second</segment><segment>component</segment><segment>is</segment><segment>the</segment><segment>state</segment><segment>matrix,</segment><segment>which</segment><segment>combines</segment><segment>role,</segment><segment>session,</segment><segment>object,</segment><segment>and</segment><segment>workflow</segment><segment>conditions.</segment><segment>The</segment><segment>third</segment><segment>component</segment><segment>is</segment><segment>the</segment><segment>standards-mapping</segment><segment>layer,</segment><segment>which</segment><segment>connects</segment><segment>scenarios</segment><segment>to</segment><segment>OWASP,</segment><segment>NIST,</segment><segment>CISA,</segment><segment>MITRE,</segment><segment>OAuth,</segment><segment>and</segment><segment>OpenID</segment><segment>guidance.</segment><segment>The</segment><segment>fourth</segment><segment>component</segment><segment>is</segment><segment>the</segment><segment>scenario</segment><segment>documentation</segment><segment>template.</segment><segment>The</segment><segment>fifth</segment><segment>component</segment><segment>is</segment><segment>the</segment><segment>evaluation</segment><segment>criteria</segment><segment>set,</segment><segment>which</segment><segment>supports</segment><segment>future</segment><segment>comparison</segment><segment>of</segment><segment>manual</segment><segment>testing,</segment><segment>scanner-assisted</segment><segment>testing,</segment><segment>AI-</segment><segment>assisted</segment><segment>testing,</segment><segment>and</segment><segment>standards-based</segment><segment>review.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>14</segment><segment>These</segment><segment>components</segment><segment>are</segment><segment>designed</segment><segment>to</segment><segment>be</segment><segment>modular.</segment><segment>A</segment><segment>researcher</segment><segment>can</segment><segment>use</segment><segment>the</segment><segment>taxonomy</segment><segment>to</segment><segment>classify</segment><segment>scenarios,</segment><segment>the</segment><segment>template</segment><segment>to</segment><segment>document</segment><segment>cases,</segment><segment>the</segment><segment>standards</segment><segment>mapping</segment><segment>to</segment><segment>justify</segment><segment>relevance,</segment><segment>and</segment><segment>the</segment><segment>evaluation</segment><segment>criteria</segment><segment>to</segment><segment>compare</segment><segment>methods.</segment><segment>A</segment><segment>practitioner</segment><segment>can</segment><segment>use</segment><segment>the</segment><segment>same</segment><segment>structure</segment><segment>for</segment><segment>training,</segment><segment>secure-code</segment><segment>review,</segment><segment>and</segment><segment>controlled</segment><segment>laboratory</segment><segment>exercises.</segment><segment>Fig.</segment><segment>3</segment><segment>operationalizes</segment><segment>the</segment><segment>benchmark</segment><segment>construction</segment><segment>sequence.</segment><segment>The</segment><segment>process</segment><segment>starts</segment><segment>from</segment><segment>a</segment><segment>security</segment><segment>policy,</segment><segment>converts</segment><segment>it</segment><segment>into</segment><segment>allowed</segment><segment>and</segment><segment>denied</segment><segment>state</segment><segment>pairs,</segment><segment>records</segment><segment>evidence,</segment><segment>maps</segment><segment>the</segment><segment>scenario</segment><segment>to</segment><segment>standards,</segment><segment>and</segment><segment>then</segment><segment>allows</segment><segment>a</segment><segment>future</segment><segment>evaluator</segment><segment>to</segment><segment>compare</segment><segment>testing</segment><segment>methods.</segment><segment>Fig.</segment><segment>3.</segment><segment>Benchmark</segment><segment>scenario</segment><segment>construction</segment><segment>and</segment><segment>evaluation</segment><segment>pipeline.</segment><segment>3.3</segment><segment>Standards</segment><segment>or</segment><segment>Literature</segment><segment>Mapping</segment><segment>The</segment><segment>standards-mapping</segment><segment>layer</segment><segment>is</segment><segment>essential</segment><segment>because</segment><segment>it</segment><segment>prevents</segment><segment>the</segment><segment>benchmark</segment><segment>from</segment><segment>becoming</segment><segment>an</segment><segment>arbitrary</segment><segment>list</segment><segment>of</segment><segment>invented</segment><segment>scenarios.</segment><segment>Broken</segment><segment>access</segment><segment>control</segment><segment>maps</segment><segment>to</segment><segment>OWASP</segment><segment>A01:2025</segment><segment>and</segment><segment>to</segment><segment>API-level</segment><segment>risks</segment><segment>such</segment><segment>as</segment><segment>BOLA</segment><segment>and</segment><segment>BFLA</segment><segment>[2]-[4].</segment><segment>Authentication</segment><segment>and</segment><segment>session-management</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>15</segment><segment>scenarios</segment><segment>map</segment><segment>to</segment><segment>ASVS</segment><segment>requirements,</segment><segment>OAuth</segment><segment>2.0</segment><segment>security</segment><segment>guidance,</segment><segment>OpenID</segment><segment>Connect,</segment><segment>and</segment><segment>CWE</segment><segment>categories</segment><segment>for</segment><segment>improper</segment><segment>authentication,</segment><segment>missing</segment><segment>authentication,</segment><segment>insufficient</segment><segment>session</segment><segment>expiration,</segment><segment>and</segment><segment>token</segment><segment>misuse</segment><segment>[5],</segment><segment>[13]-[15],</segment><segment>[21]-[23].</segment><segment>Secure-development</segment><segment>and</segment><segment>vulnerability-</segment><segment>management</segment><segment>relevance</segment><segment>maps</segment><segment>to</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design,</segment><segment>CVSS,</segment><segment>EPSS,</segment><segment>and</segment><segment>benchmark</segment><segment>literature</segment><segment>[8],</segment><segment>[19],</segment><segment>[20],</segment><segment>[24],</segment><segment>[25],</segment><segment>[37]-[40].</segment><segment>3.4</segment><segment>Evaluation</segment><segment>Logic</segment><segment>AuthStateBench</segment><segment>does</segment><segment>not</segment><segment>present</segment><segment>accuracy,</segment><segment>precision,</segment><segment>recall,</segment><segment>F1-score,</segment><segment>exploit</segment><segment>success,</segment><segment>scanner</segment><segment>results,</segment><segment>or</segment><segment>AI-agent</segment><segment>performance.</segment><segment>Instead,</segment><segment>it</segment><segment>defines</segment><segment>how</segment><segment>future</segment><segment>studies</segment><segment>can</segment><segment>evaluate</segment><segment>such</segment><segment>outcomes</segment><segment>responsibly.</segment><segment>A</segment><segment>future</segment><segment>evaluation</segment><segment>can</segment><segment>compare</segment><segment>whether</segment><segment>a</segment><segment>method</segment><segment>identifies</segment><segment>the</segment><segment>correct</segment><segment>scenario</segment><segment>class,</segment><segment>recognizes</segment><segment>the</segment><segment>required</segment><segment>preconditions,</segment><segment>distinguishes</segment><segment>authentication</segment><segment>from</segment><segment>authorization,</segment><segment>determines</segment><segment>object</segment><segment>ownership,</segment><segment>checks</segment><segment>workflow</segment><segment>order,</segment><segment>explains</segment><segment>evidence,</segment><segment>and</segment><segment>maps</segment><segment>findings</segment><segment>to</segment><segment>standards.</segment><segment>This</segment><segment>design</segment><segment>avoids</segment><segment>false</segment><segment>empirical</segment><segment>claims</segment><segment>while</segment><segment>still</segment><segment>providing</segment><segment>a</segment><segment>concrete</segment><segment>foundation</segment><segment>for</segment><segment>empirical</segment><segment>work.</segment><segment>3.5</segment><segment>Justification</segment><segment>Stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>weaknesses</segment><segment>require</segment><segment>scenario-based</segment><segment>benchmark</segment><segment>design</segment><segment>because</segment><segment>isolated</segment><segment>request</segment><segment>testing</segment><segment>is</segment><segment>insufficient.</segment><segment>For</segment><segment>example,</segment><segment>a</segment><segment>GET</segment><segment>request</segment><segment>for</segment><segment>/invoice/124</segment><segment>may</segment><segment>be</segment><segment>secure</segment><segment>for</segment><segment>the</segment><segment>owner</segment><segment>and</segment><segment>insecure</segment><segment>for</segment><segment>a</segment><segment>different</segment><segment>user.</segment><segment>A</segment><segment>POST</segment><segment>request</segment><segment>that</segment><segment>approves</segment><segment>a</segment><segment>transaction</segment><segment>may</segment><segment>be</segment><segment>correct</segment><segment>after</segment><segment>review</segment><segment>and</segment><segment>insecure</segment><segment>before</segment><segment>review.</segment><segment>A</segment><segment>session</segment><segment>token</segment><segment>may</segment><segment>be</segment><segment>valid</segment><segment>before</segment><segment>logout</segment><segment>and</segment><segment>insecure</segment><segment>if</segment><segment>accepted</segment><segment>afterward.</segment><segment>These</segment><segment>cases</segment><segment>cannot</segment><segment>be</segment><segment>benchmarked</segment><segment>by</segment><segment>request</segment><segment>shape</segment><segment>alone;</segment><segment>they</segment><segment>require</segment><segment>documented</segment><segment>state.</segment><segment>AuthStateBench</segment><segment>makes</segment><segment>this</segment><segment>state</segment><segment>explicit</segment><segment>and</segment><segment>therefore</segment><segment>improves</segment><segment>reproducibility,</segment><segment>comparability,</segment><segment>and</segment><segment>standards</segment><segment>alignment.</segment><segment>Table</segment><segment>4.</segment><segment>AuthStateBench</segment><segment>scenario</segment><segment>taxonomy.</segment><segment>Scenario</segment><segment>class</segment><segment>Core</segment><segment>failure</segment><segment>Object-level</segment><segment>authorization</segment><segment>failure</segment><segment>Function-level</segment><segment>authorization</segment><segment>failure</segment><segment>Privilege</segment><segment>escalation</segment><segment>Actor</segment><segment>accesses</segment><segment>an</segment><segment>object</segment><segment>that</segment><segment>belongs</segment><segment>to</segment><segment>another</segment><segment>user,</segment><segment>tenant,</segment><segment>or</segment><segment>role.</segment><segment>Actor</segment><segment>reaches</segment><segment>a</segment><segment>function</segment><segment>outside</segment><segment>permitted</segment><segment>role</segment><segment>or</segment><segment>permission</segment><segment>scope.</segment><segment>Actor</segment><segment>gains</segment><segment>elevated</segment><segment>capability</segment><segment>by</segment><segment>manipulating</segment><segment>role,</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Typical</segment><segment>state</segment><segment>dimensions</segment><segment>Role</segment><segment>state</segment><segment>+</segment><segment>object</segment><segment>ownership</segment><segment>+</segment><segment>session</segment><segment>validity</segment><segment>Role</segment><segment>state</segment><segment>+</segment><segment>workflow</segment><segment>state</segment><segment>Role</segment><segment>state</segment><segment>+</segment><segment>session</segment><segment>state</segment><segment>+</segment><segment>workflow</segment><segment>state</segment><segment>Example</segment><segment>secure</segment><segment>expectation</segment><segment>The</segment><segment>server</segment><segment>checks</segment><segment>ownership</segment><segment>or</segment><segment>tenant</segment><segment>boundary</segment><segment>for</segment><segment>every</segment><segment>object</segment><segment>access.</segment><segment>The</segment><segment>server</segment><segment>enforces</segment><segment>function</segment><segment>permissions</segment><segment>independent</segment><segment>of</segment><segment>hidden</segment><segment>UI</segment><segment>controls.</segment><segment>Privilege</segment><segment>transitions</segment><segment>require</segment><segment>server-side</segment><segment>authorization</segment><segment>and</segment><segment>G.</segment><segment>2076</segment><segment>Session</segment><segment>lifecycle</segment><segment>failure</segment><segment>token,</segment><segment>endpoint,</segment><segment>or</segment><segment>transition.</segment><segment>Expired,</segment><segment>logged-out,</segment><segment>fixed,</segment><segment>or</segment><segment>stale</segment><segment>tokens</segment><segment>remain</segment><segment>usable.</segment><segment>Session</segment><segment>state</segment><segment>+</segment><segment>role</segment><segment>state</segment><segment>Workflow</segment><segment>bypass</segment><segment>Actor</segment><segment>skips</segment><segment>or</segment><segment>reorders</segment><segment>required</segment><segment>process</segment><segment>steps.</segment><segment>Workflow</segment><segment>state</segment><segment>+</segment><segment>role</segment><segment>state</segment><segment>+</segment><segment>object</segment><segment>ownership</segment><segment>Role-confusion</segment><segment>failure</segment><segment>Tenant-isolation</segment><segment>failure</segment><segment>Reauthentication</segment><segment>failure</segment><segment>Role</segment><segment>state</segment><segment>+</segment><segment>session</segment><segment>state</segment><segment>Object</segment><segment>ownership</segment><segment>+</segment><segment>role</segment><segment>state</segment><segment>Session</segment><segment>state</segment><segment>+</segment><segment>workflow</segment><segment>state</segment><segment>Application</segment><segment>confuses</segment><segment>guest,</segment><segment>user,</segment><segment>privileged</segment><segment>user,</segment><segment>admin,</segment><segment>or</segment><segment>downgraded</segment><segment>role.</segment><segment>Actor</segment><segment>crosses</segment><segment>organization,</segment><segment>workspace,</segment><segment>or</segment><segment>tenant</segment><segment>boundary.</segment><segment>Sensitive</segment><segment>action</segment><segment>proceeds</segment><segment>without</segment><segment>fresh</segment><segment>authentication</segment><segment>or</segment><segment>step-up</segment><segment>verification.</segment><segment>Page</segment><segment>16</segment><segment>reauthentication</segment><segment>where</segment><segment>appropriate.</segment><segment>Tokens</segment><segment>are</segment><segment>invalidated</segment><segment>and</segment><segment>refreshed</segment><segment>according</segment><segment>to</segment><segment>security</segment><segment>requirements.</segment><segment>Business</segment><segment>operations</segment><segment>require</segment><segment>all</segment><segment>preconditions</segment><segment>and</segment><segment>state</segment><segment>transitions.</segment><segment>Server-side</segment><segment>policy</segment><segment>resolves</segment><segment>role</segment><segment>correctly</segment><segment>after</segment><segment>login,</segment><segment>logout,</segment><segment>downgrade,</segment><segment>or</segment><segment>account</segment><segment>changes.</segment><segment>Tenant</segment><segment>boundary</segment><segment>is</segment><segment>enforced</segment><segment>for</segment><segment>every</segment><segment>resource</segment><segment>and</segment><segment>function.</segment><segment>High-risk</segment><segment>operations</segment><segment>require</segment><segment>fresh</segment><segment>identity</segment><segment>assurance</segment><segment>or</segment><segment>equivalent</segment><segment>control.</segment><segment>Table</segment><segment>5.</segment><segment>Role-session-object-workflow</segment><segment>state</segment><segment>matrix.</segment><segment>Role</segment><segment>state</segment><segment>Dimension</segment><segment>Session</segment><segment>state</segment><segment>Representative</segment><segment>states</segment><segment>Guest,</segment><segment>registered</segment><segment>user,</segment><segment>privileged</segment><segment>user,</segment><segment>admin,</segment><segment>downgraded</segment><segment>user,</segment><segment>service</segment><segment>account</segment><segment>Valid,</segment><segment>expired,</segment><segment>reused,</segment><segment>fixed,</segment><segment>logged</segment><segment>out,</segment><segment>token</segment><segment>changed,</segment><segment>privilege</segment><segment>changed,</segment><segment>reauthenticated</segment><segment>Object-ownership</segment><segment>Owned</segment><segment>object,</segment><segment>unowned</segment><segment>object,</segment><segment>state</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Security</segment><segment>question</segment><segment>Failure</segment><segment>indicator</segment><segment>Is</segment><segment>the</segment><segment>actor</segment><segment>allowed</segment><segment>to</segment><segment>perform</segment><segment>this</segment><segment>function?</segment><segment>Is</segment><segment>the</segment><segment>session</segment><segment>state</segment><segment>acceptable</segment><segment>for</segment><segment>the</segment><segment>requested</segment><segment>action?</segment><segment>Function</segment><segment>succeeds</segment><segment>for</segment><segment>a</segment><segment>role</segment><segment>outside</segment><segment>intended</segment><segment>permission</segment><segment>scope.</segment><segment>Action</segment><segment>succeeds</segment><segment>with</segment><segment>stale,</segment><segment>invalid,</segment><segment>fixed,</segment><segment>or</segment><segment>insufficiently</segment><segment>fresh</segment><segment>session</segment><segment>context.</segment><segment>Does</segment><segment>the</segment><segment>actor</segment><segment>have</segment><segment>rights</segment><segment>over</segment><segment>this</segment><segment>Object</segment><segment>data</segment><segment>or</segment><segment>action</segment><segment>succeeds</segment><segment>across</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>17</segment><segment>Workflow</segment><segment>state</segment><segment>shared</segment><segment>object,</segment><segment>hidden</segment><segment>object,</segment><segment>tenant-</segment><segment>specific</segment><segment>object</segment><segment>Normal</segment><segment>sequence,</segment><segment>skipped</segment><segment>step,</segment><segment>repeated</segment><segment>step,</segment><segment>forced</segment><segment>endpoint,</segment><segment>post-</segment><segment>approval</segment><segment>state,</segment><segment>rollback</segment><segment>state</segment><segment>specific</segment><segment>object</segment><segment>instance?</segment><segment>ownership</segment><segment>or</segment><segment>tenant</segment><segment>boundary.</segment><segment>Has</segment><segment>the</segment><segment>process</segment><segment>reached</segment><segment>the</segment><segment>required</segment><segment>business</segment><segment>state?</segment><segment>Endpoint</segment><segment>allows</segment><segment>action</segment><segment>before</segment><segment>required</segment><segment>preconditions</segment><segment>or</segment><segment>after</segment><segment>invalid</segment><segment>transition.</segment><segment>Table</segment><segment>6.</segment><segment>OWASP</segment><segment>Top</segment><segment>10</segment><segment>/</segment><segment>ASVS</segment><segment>/</segment><segment>NIST</segment><segment>SSDF</segment><segment>/</segment><segment>CWE</segment><segment>mapping</segment><segment>table.</segment><segment>Benchmark</segment><segment>class</segment><segment>Object-level</segment><segment>authorization</segment><segment>failure</segment><segment>OWASP</segment><segment>mapping</segment><segment>OWASP</segment><segment>A01:2025;</segment><segment>API1:2023</segment><segment>BOLA</segment><segment>ASVS</segment><segment>/</segment><segment>WSTG</segment><segment>mapping</segment><segment>Access</segment><segment>control</segment><segment>and</segment><segment>API</segment><segment>testing</segment><segment>requirements</segment><segment>Function-level</segment><segment>authorization</segment><segment>failure</segment><segment>OWASP</segment><segment>A01:2025;</segment><segment>API5:2023</segment><segment>BFLA</segment><segment>Authentication</segment><segment>workflow</segment><segment>failure</segment><segment>Session</segment><segment>lifecycle</segment><segment>failure</segment><segment>OWASP</segment><segment>authentication-</segment><segment>related</segment><segment>risks;</segment><segment>API2:2023</segment><segment>Broken</segment><segment>Authentication</segment><segment>Broken</segment><segment>access</segment><segment>control</segment><segment>and</segment><segment>authentication-</segment><segment>adjacent</segment><segment>risk</segment><segment>Workflow</segment><segment>bypass</segment><segment>Business</segment><segment>logic</segment><segment>abuse;</segment><segment>broken</segment><segment>Server-side</segment><segment>authorization</segment><segment>verification;</segment><segment>business</segment><segment>logic</segment><segment>testing</segment><segment>Authentication</segment><segment>and</segment><segment>identity</segment><segment>verification</segment><segment>requirements</segment><segment>Session</segment><segment>management</segment><segment>verification;</segment><segment>logout</segment><segment>and</segment><segment>timeout</segment><segment>testing</segment><segment>Business</segment><segment>logic</segment><segment>and</segment><segment>workflow</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>NIST</segment><segment>/</segment><segment>CISA</segment><segment>mapping</segment><segment>SSDF</segment><segment>verification</segment><segment>and</segment><segment>vulnerability</segment><segment>response;</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>default</segment><segment>protection</segment><segment>Secure</segment><segment>design</segment><segment>review</segment><segment>and</segment><segment>threat</segment><segment>modeling</segment><segment>CWE</segment><segment>mapping</segment><segment>CWE-284,</segment><segment>CWE-862,</segment><segment>CWE-863,</segment><segment>CWE-639</segment><segment>CWE-862,</segment><segment>CWE-863</segment><segment>SSDF</segment><segment>secure</segment><segment>design</segment><segment>and</segment><segment>verification</segment><segment>CWE-287,</segment><segment>CWE-306</segment><segment>Secure</segment><segment>default</segment><segment>session</segment><segment>behavior</segment><segment>CWE-613,</segment><segment>CWE-287</segment><segment>Threat</segment><segment>modeling</segment><segment>and</segment><segment>secure</segment><segment>CWE-840,</segment><segment>CWE-863,</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>18</segment><segment>access</segment><segment>control</segment><segment>Broken</segment><segment>access</segment><segment>control;</segment><segment>API</segment><segment>object-level</segment><segment>access</segment><segment>control</segment><segment>Broken</segment><segment>access</segment><segment>control;</segment><segment>authentication</segment><segment>control</segment><segment>weakness</segment><segment>testing</segment><segment>Access</segment><segment>control</segment><segment>and</segment><segment>data</segment><segment>isolation</segment><segment>verification</segment><segment>Fresh</segment><segment>authentication</segment><segment>for</segment><segment>sensitive</segment><segment>actions</segment><segment>requirements</segment><segment>Secure</segment><segment>architecture</segment><segment>and</segment><segment>product</segment><segment>safety</segment><segment>CWE-862</segment><segment>CWE-284,</segment><segment>CWE-862,</segment><segment>CWE-863</segment><segment>Identity</segment><segment>assurance</segment><segment>and</segment><segment>secure</segment><segment>defaults</segment><segment>CWE-287,</segment><segment>CWE-306</segment><segment>Table</segment><segment>7.</segment><segment>Benchmark</segment><segment>scenario</segment><segment>template.</segment><segment>Tenant-isolation</segment><segment>failure</segment><segment>Reauthentication</segment><segment>failure</segment><segment>Field</segment><segment>Scenario</segment><segment>ID</segment><segment>Scenario</segment><segment>class</segment><segment>Attacker</segment><segment>role</segment><segment>Victim/target</segment><segment>role</segment><segment>Object</segment><segment>ownership</segment><segment>condition</segment><segment>Session</segment><segment>condition</segment><segment>Workflow</segment><segment>precondition</segment><segment>Attack</segment><segment>action</segment><segment>Expected</segment><segment>secure</segment><segment>behavior</segment><segment>Insecure</segment><segment>behavior</segment><segment>Standards</segment><segment>mapping</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Description</segment><segment>Unique</segment><segment>identifier</segment><segment>such</segment><segment>as</segment><segment>ASB-OBJ-001</segment><segment>or</segment><segment>ASB-SES-003.</segment><segment>Taxonomy</segment><segment>category,</segment><segment>such</segment><segment>as</segment><segment>object-level</segment><segment>authorization</segment><segment>failure</segment><segment>or</segment><segment>session</segment><segment>lifecycle</segment><segment>failure.</segment><segment>The</segment><segment>role</segment><segment>from</segment><segment>which</segment><segment>the</segment><segment>unauthorized</segment><segment>action</segment><segment>is</segment><segment>attempted.</segment><segment>The</segment><segment>role</segment><segment>or</segment><segment>account</segment><segment>owning</segment><segment>the</segment><segment>target</segment><segment>resource,</segment><segment>if</segment><segment>applicable.</segment><segment>Owned,</segment><segment>unowned,</segment><segment>shared,</segment><segment>hidden,</segment><segment>cross-</segment><segment>tenant,</segment><segment>or</segment><segment>system-owned</segment><segment>object.</segment><segment>Valid,</segment><segment>expired,</segment><segment>logged</segment><segment>out,</segment><segment>token</segment><segment>refreshed,</segment><segment>privilege</segment><segment>changed,</segment><segment>stale,</segment><segment>fixed,</segment><segment>or</segment><segment>reauthenticated.</segment><segment>Normal</segment><segment>sequence,</segment><segment>skipped</segment><segment>stage,</segment><segment>repeated</segment><segment>stage,</segment><segment>forced</segment><segment>endpoint,</segment><segment>pre-approval,</segment><segment>post-</segment><segment>approval,</segment><segment>or</segment><segment>rollback.</segment><segment>Abstract</segment><segment>action</segment><segment>attempted</segment><segment>in</segment><segment>the</segment><segment>controlled</segment><segment>benchmark</segment><segment>scenario.</segment><segment>Policy</segment><segment>decision</segment><segment>that</segment><segment>should</segment><segment>occur</segment><segment>in</segment><segment>a</segment><segment>secure</segment><segment>implementation.</segment><segment>Failure</segment><segment>condition</segment><segment>that</segment><segment>marks</segment><segment>the</segment><segment>scenario</segment><segment>vulnerable</segment><segment>in</segment><segment>an</segment><segment>intentionally</segment><segment>vulnerable</segment><segment>implementation.</segment><segment>OWASP,</segment><segment>ASVS,</segment><segment>WSTG,</segment><segment>NIST,</segment><segment>CISA,</segment><segment>MITRE</segment><segment>CWE,</segment><segment>OAuth/OIDC</segment><segment>mapping</segment><segment>as</segment><segment>applicable.</segment><segment>G.</segment><segment>2076</segment><segment>Evidence</segment><segment>requirement</segment><segment>4.</segment><segment>Methodology</segment><segment>Page</segment><segment>19</segment><segment>What</segment><segment>future</segment><segment>testers</segment><segment>must</segment><segment>record:</segment><segment>request</segment><segment>sequence,</segment><segment>session</segment><segment>state,</segment><segment>role</segment><segment>pair,</segment><segment>object</segment><segment>ID</segment><segment>relation,</segment><segment>response,</segment><segment>and</segment><segment>policy</segment><segment>rationale.</segment><segment>4.1</segment><segment>Research</segment><segment>Design</segment><segment>The</segment><segment>research</segment><segment>design</segment><segment>combined</segment><segment>structured</segment><segment>literature</segment><segment>review,</segment><segment>standards</segment><segment>mapping,</segment><segment>conceptual</segment><segment>synthesis,</segment><segment>and</segment><segment>benchmark</segment><segment>design.</segment><segment>The</segment><segment>study</segment><segment>was</segment><segment>not</segment><segment>conducted</segment><segment>as</segment><segment>an</segment><segment>empirical</segment><segment>tool-</segment><segment>evaluation</segment><segment>experiment.</segment><segment>No</segment><segment>scanner</segment><segment>was</segment><segment>executed,</segment><segment>no</segment><segment>vulnerable</segment><segment>laboratory</segment><segment>was</segment><segment>deployed,</segment><segment>no</segment><segment>live</segment><segment>target</segment><segment>was</segment><segment>tested,</segment><segment>and</segment><segment>no</segment><segment>private</segment><segment>dataset</segment><segment>was</segment><segment>analyzed.</segment><segment>The</segment><segment>method</segment><segment>instead</segment><segment>used</segment><segment>literature</segment><segment>and</segment><segment>standards</segment><segment>to</segment><segment>derive</segment><segment>a</segment><segment>benchmark</segment><segment>design</segment><segment>that</segment><segment>can</segment><segment>later</segment><segment>support</segment><segment>implementation</segment><segment>and</segment><segment>evaluation.</segment><segment>This</segment><segment>design</segment><segment>is</segment><segment>appropriate</segment><segment>because</segment><segment>the</segment><segment>contribution</segment><segment>is</segment><segment>a</segment><segment>scenario-construction</segment><segment>model.</segment><segment>A</segment><segment>benchmark-design</segment><segment>article</segment><segment>must</segment><segment>first</segment><segment>define</segment><segment>what</segment><segment>counts</segment><segment>as</segment><segment>a</segment><segment>scenario,</segment><segment>what</segment><segment>security</segment><segment>property</segment><segment>is</segment><segment>being</segment><segment>tested,</segment><segment>what</segment><segment>state</segment><segment>must</segment><segment>be</segment><segment>recorded,</segment><segment>and</segment><segment>how</segment><segment>relevance</segment><segment>is</segment><segment>mapped</segment><segment>to</segment><segment>standards</segment><segment>before</segment><segment>performance</segment><segment>claims</segment><segment>can</segment><segment>be</segment><segment>evaluated.</segment><segment>4.2</segment><segment>Search</segment><segment>Strategy</segment><segment>/</segment><segment>Data</segment><segment>Source</segment><segment>Strategy</segment><segment>The</segment><segment>search</segment><segment>strategy</segment><segment>used</segment><segment>combinations</segment><segment>of</segment><segment>terms</segment><segment>such</segment><segment>as</segment><segment>“broken</segment><segment>access</segment><segment>control</segment><segment>web</segment><segment>application</segment><segment>testing,”</segment><segment>“authorization</segment><segment>vulnerability</segment><segment>benchmark,”</segment><segment>“authentication</segment><segment>workflow</segment><segment>vulnerability,”</segment><segment>“stateful</segment><segment>web</segment><segment>application</segment><segment>security</segment><segment>testing,”</segment><segment>“IDOR</segment><segment>BOLA</segment><segment>benchmark,”</segment><segment>“role-</segment><segment>based</segment><segment>access</segment><segment>control</segment><segment>web</segment><segment>vulnerability,”</segment><segment>“workflow</segment><segment>bypass</segment><segment>web</segment><segment>security,”</segment><segment>“session</segment><segment>management</segment><segment>vulnerability</segment><segment>testing,”</segment><segment>“OWASP</segment><segment>ASVS</segment><segment>access</segment><segment>control</segment><segment>requirements,”</segment><segment>“web</segment><segment>vulnerability</segment><segment>benchmark</segment><segment>evaluation,”</segment><segment>and</segment><segment>“AI-assisted</segment><segment>vulnerability</segment><segment>detection</segment><segment>benchmark.”</segment><segment>Searches</segment><segment>prioritized</segment><segment>peer-reviewed</segment><segment>databases</segment><segment>and</segment><segment>official</segment><segment>standards</segment><segment>sources.</segment><segment>Google</segment><segment>Scholar</segment><segment>was</segment><segment>used</segment><segment>for</segment><segment>discovery,</segment><segment>while</segment><segment>preference</segment><segment>was</segment><segment>given</segment><segment>to</segment><segment>publisher</segment><segment>pages,</segment><segment>official</segment><segment>project</segment><segment>pages,</segment><segment>government</segment><segment>guidance,</segment><segment>RFCs,</segment><segment>and</segment><segment>standards</segment><segment>pages</segment><segment>where</segment><segment>available.</segment><segment>The</segment><segment>source</segment><segment>base</segment><segment>included</segment><segment>academic</segment><segment>literature</segment><segment>on</segment><segment>access-control</segment><segment>analysis,</segment><segment>stateful</segment><segment>web</segment><segment>testing,</segment><segment>web</segment><segment>logic</segment><segment>flaws,</segment><segment>scanner</segment><segment>evaluation,</segment><segment>benchmarks,</segment><segment>and</segment><segment>AI-assisted</segment><segment>vulnerability</segment><segment>detection</segment><segment>[26]-[46].</segment><segment>It</segment><segment>also</segment><segment>included</segment><segment>standards</segment><segment>and</segment><segment>guidance</segment><segment>from</segment><segment>OWASP,</segment><segment>NIST,</segment><segment>MITRE,</segment><segment>CISA,</segment><segment>FIRST,</segment><segment>OAuth,</segment><segment>OpenID,</segment><segment>and</segment><segment>ISO/IEC</segment><segment>[1]-[25],</segment><segment>[47]-[49].</segment><segment>4.3</segment><segment>Inclusion</segment><segment>and</segment><segment>Exclusion</segment><segment>Criteria</segment><segment>Sources</segment><segment>were</segment><segment>included</segment><segment>when</segment><segment>they</segment><segment>focused</segment><segment>on</segment><segment>web</segment><segment>application</segment><segment>security,</segment><segment>API</segment><segment>security,</segment><segment>authentication,</segment><segment>authorization,</segment><segment>session</segment><segment>management,</segment><segment>workflow</segment><segment>abuse,</segment><segment>benchmark</segment><segment>design,</segment><segment>vulnerability</segment><segment>detection,</segment><segment>scanner</segment><segment>evaluation,</segment><segment>or</segment><segment>secure-development</segment><segment>guidance.</segment><segment>Foundational</segment><segment>older</segment><segment>sources</segment><segment>were</segment><segment>retained</segment><segment>when</segment><segment>they</segment><segment>introduced</segment><segment>important</segment><segment>concepts</segment><segment>or</segment><segment>methods</segment><segment>for</segment><segment>access-</segment><segment>control</segment><segment>vulnerability</segment><segment>detection</segment><segment>or</segment><segment>web</segment><segment>logic</segment><segment>testing.</segment><segment>Sources</segment><segment>were</segment><segment>excluded</segment><segment>when</segment><segment>they</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>20</segment><segment>focused</segment><segment>only</segment><segment>on</segment><segment>generic</segment><segment>cybersecurity,</segment><segment>malware,</segment><segment>blockchain,</segment><segment>IoT,</segment><segment>or</segment><segment>network</segment><segment>intrusion</segment><segment>without</segment><segment>web</segment><segment>application</segment><segment>relevance,</segment><segment>or</segment><segment>when</segment><segment>they</segment><segment>made</segment><segment>unsupported</segment><segment>claims</segment><segment>about</segment><segment>automation</segment><segment>replacing</segment><segment>human</segment><segment>security</segment><segment>testing.</segment><segment>4.4</segment><segment>Screening</segment><segment>or</segment><segment>Selection</segment><segment>Process</segment><segment>The</segment><segment>screening</segment><segment>process</segment><segment>followed</segment><segment>a</segment><segment>transparent</segment><segment>review</segment><segment>approach</segment><segment>rather</segment><segment>than</segment><segment>a</segment><segment>fully</segment><segment>quantified</segment><segment>PRISMA</segment><segment>systematic</segment><segment>review.</segment><segment>Because</segment><segment>exact</segment><segment>search</segment><segment>counts,</segment><segment>duplicate</segment><segment>counts,</segment><segment>and</segment><segment>exclusion</segment><segment>counts</segment><segment>were</segment><segment>not</segment><segment>recorded</segment><segment>in</segment><segment>a</segment><segment>formal</segment><segment>review</segment><segment>registry,</segment><segment>this</segment><segment>article</segment><segment>does</segment><segment>not</segment><segment>claim</segment><segment>a</segment><segment>completed</segment><segment>PRISMA</segment><segment>study.</segment><segment>Instead,</segment><segment>sources</segment><segment>were</segment><segment>screened</segment><segment>by</segment><segment>title,</segment><segment>abstract,</segment><segment>technical</segment><segment>relevance,</segment><segment>standards</segment><segment>relevance,</segment><segment>and</segment><segment>contribution</segment><segment>to</segment><segment>scenario</segment><segment>modeling.</segment><segment>Selected</segment><segment>sources</segment><segment>were</segment><segment>then</segment><segment>coded</segment><segment>according</segment><segment>to</segment><segment>vulnerability</segment><segment>type,</segment><segment>testing</segment><segment>approach,</segment><segment>state</segment><segment>dimension,</segment><segment>benchmark</segment><segment>relevance,</segment><segment>and</segment><segment>standards</segment><segment>applicability.</segment><segment>4.5</segment><segment>Coding</segment><segment>and</segment><segment>Synthesis</segment><segment>Method</segment><segment>Thematic</segment><segment>synthesis</segment><segment>grouped</segment><segment>the</segment><segment>literature</segment><segment>into</segment><segment>four</segment><segment>state</segment><segment>dimensions:</segment><segment>role</segment><segment>state,</segment><segment>session</segment><segment>state,</segment><segment>object-ownership</segment><segment>state,</segment><segment>and</segment><segment>workflow</segment><segment>state.</segment><segment>Role</segment><segment>state</segment><segment>captured</segment><segment>guest,</segment><segment>user,</segment><segment>privileged</segment><segment>user,</segment><segment>admin,</segment><segment>downgraded</segment><segment>user,</segment><segment>and</segment><segment>service-account</segment><segment>contexts.</segment><segment>Session</segment><segment>state</segment><segment>captured</segment><segment>valid,</segment><segment>expired,</segment><segment>reused,</segment><segment>fixed,</segment><segment>logged-out,</segment><segment>token-changed,</segment><segment>and</segment><segment>reauthenticated</segment><segment>contexts.</segment><segment>Object</segment><segment>state</segment><segment>captured</segment><segment>owned,</segment><segment>unowned,</segment><segment>shared,</segment><segment>hidden,</segment><segment>tenant-specific,</segment><segment>and</segment><segment>system-owned</segment><segment>objects.</segment><segment>Workflow</segment><segment>state</segment><segment>captured</segment><segment>normal</segment><segment>sequence,</segment><segment>skipped</segment><segment>step,</segment><segment>repeated</segment><segment>step,</segment><segment>forced</segment><segment>endpoint,</segment><segment>pre-approval,</segment><segment>post-</segment><segment>approval,</segment><segment>and</segment><segment>rollback</segment><segment>conditions.</segment><segment>Fig.</segment><segment>4</segment><segment>illustrates</segment><segment>how</segment><segment>literature,</segment><segment>standards,</segment><segment>and</segment><segment>weakness</segment><segment>taxonomies</segment><segment>were</segment><segment>synthesized</segment><segment>into</segment><segment>the</segment><segment>benchmark</segment><segment>outputs.</segment><segment>The</segment><segment>figure</segment><segment>also</segment><segment>makes</segment><segment>clear</segment><segment>that</segment><segment>the</segment><segment>article</segment><segment>is</segment><segment>a</segment><segment>design</segment><segment>study</segment><segment>rather</segment><segment>than</segment><segment>a</segment><segment>tool-execution</segment><segment>experiment.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>21</segment><segment>Fig.</segment><segment>4.</segment><segment>Literature</segment><segment>and</segment><segment>standards</segment><segment>synthesis</segment><segment>process</segment><segment>used</segment><segment>to</segment><segment>derive</segment><segment>AuthStateBench.</segment><segment>Algorithm</segment><segment>1.</segment><segment>AuthStateBench</segment><segment>scenario</segment><segment>construction</segment><segment>procedure.</segment><segment>Input:</segment><segment>Candidate</segment><segment>weakness</segment><segment>pattern,</segment><segment>relevant</segment><segment>standard</segment><segment>clauses,</segment><segment>state</segment><segment>dimensions,</segment><segment>and</segment><segment>expected</segment><segment>security</segment><segment>policy.</segment><segment>1.</segment><segment>Identify</segment><segment>the</segment><segment>protected</segment><segment>action</segment><segment>and</segment><segment>target</segment><segment>object.</segment><segment>2.</segment><segment>Define</segment><segment>the</segment><segment>legitimate</segment><segment>role,</segment><segment>unauthorized</segment><segment>role,</segment><segment>session</segment><segment>condition,</segment><segment>and</segment><segment>workflow</segment><segment>precondition.</segment><segment>3.</segment><segment>Specify</segment><segment>the</segment><segment>expected</segment><segment>secure</segment><segment>decision</segment><segment>and</segment><segment>vulnerable</segment><segment>behavior</segment><segment>to</segment><segment>be</segment><segment>represented</segment><segment>in</segment><segment>a</segment><segment>controlled</segment><segment>implementation.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>22</segment><segment>4.</segment><segment>Map</segment><segment>the</segment><segment>scenario</segment><segment>to</segment><segment>OWASP,</segment><segment>ASVS/WSTG,</segment><segment>NIST/CISA,</segment><segment>MITRE</segment><segment>CWE,</segment><segment>and</segment><segment>identity-</segment><segment>protocol</segment><segment>guidance</segment><segment>where</segment><segment>applicable.</segment><segment>5.</segment><segment>Record</segment><segment>evidence</segment><segment>requirements:</segment><segment>actor</segment><segment>role,</segment><segment>object</segment><segment>relation,</segment><segment>session</segment><segment>state,</segment><segment>request</segment><segment>sequence,</segment><segment>response,</segment><segment>and</segment><segment>policy</segment><segment>rationale.</segment><segment>Output:</segment><segment>A</segment><segment>benchmark-ready</segment><segment>scenario</segment><segment>record</segment><segment>that</segment><segment>can</segment><segment>later</segment><segment>be</segment><segment>implemented</segment><segment>and</segment><segment>evaluated</segment><segment>in</segment><segment>a</segment><segment>controlled</segment><segment>testbed.</segment><segment>After</segment><segment>coding,</segment><segment>recurring</segment><segment>vulnerability</segment><segment>patterns</segment><segment>were</segment><segment>converted</segment><segment>into</segment><segment>benchmark</segment><segment>scenario</segment><segment>classes.</segment><segment>Each</segment><segment>scenario</segment><segment>class</segment><segment>was</segment><segment>checked</segment><segment>against</segment><segment>relevant</segment><segment>standards</segment><segment>and</segment><segment>weakness</segment><segment>taxonomies</segment><segment>to</segment><segment>verify</segment><segment>that</segment><segment>it</segment><segment>corresponded</segment><segment>to</segment><segment>recognized</segment><segment>security</segment><segment>concerns</segment><segment>rather</segment><segment>than</segment><segment>arbitrary</segment><segment>examples.</segment><segment>4.6</segment><segment>Comparison</segment><segment>Criteria</segment><segment>Existing</segment><segment>approaches</segment><segment>were</segment><segment>compared</segment><segment>using</segment><segment>standards</segment><segment>alignment,</segment><segment>explicit</segment><segment>state</segment><segment>modeling,</segment><segment>reproducibility,</segment><segment>evaluation</segment><segment>readiness,</segment><segment>evidence</segment><segment>requirements,</segment><segment>ability</segment><segment>to</segment><segment>support</segment><segment>manual</segment><segment>testing,</segment><segment>ability</segment><segment>to</segment><segment>support</segment><segment>scanner-assisted</segment><segment>testing,</segment><segment>ability</segment><segment>to</segment><segment>support</segment><segment>AI-assisted</segment><segment>testing,</segment><segment>and</segment><segment>suitability</segment><segment>for</segment><segment>secure-development</segment><segment>education.</segment><segment>These</segment><segment>criteria</segment><segment>were</segment><segment>selected</segment><segment>because</segment><segment>a</segment><segment>benchmark</segment><segment>design</segment><segment>must</segment><segment>be</segment><segment>useful</segment><segment>across</segment><segment>research</segment><segment>and</segment><segment>practice,</segment><segment>not</segment><segment>only</segment><segment>within</segment><segment>a</segment><segment>single</segment><segment>tool</segment><segment>category.</segment><segment>4.7</segment><segment>Validity</segment><segment>and</segment><segment>Reliability</segment><segment>Validity</segment><segment>was</segment><segment>supported</segment><segment>through</segment><segment>triangulation</segment><segment>across</segment><segment>peer-reviewed</segment><segment>literature,</segment><segment>official</segment><segment>standards,</segment><segment>weakness</segment><segment>taxonomies,</segment><segment>and</segment><segment>benchmark</segment><segment>resources.</segment><segment>Reliability</segment><segment>was</segment><segment>supported</segment><segment>by</segment><segment>using</segment><segment>explicit</segment><segment>scenario</segment><segment>fields</segment><segment>and</segment><segment>state</segment><segment>dimensions</segment><segment>rather</segment><segment>than</segment><segment>narrative-only</segment><segment>descriptions.</segment><segment>The</segment><segment>main</segment><segment>validity</segment><segment>limitation</segment><segment>is</segment><segment>that</segment><segment>the</segment><segment>benchmark</segment><segment>has</segment><segment>not</segment><segment>yet</segment><segment>been</segment><segment>implemented</segment><segment>as</segment><segment>runnable</segment><segment>vulnerable</segment><segment>applications</segment><segment>or</segment><segment>evaluated</segment><segment>by</segment><segment>independent</segment><segment>experts.</segment><segment>A</segment><segment>recommended</segment><segment>next</segment><segment>step</segment><segment>is</segment><segment>expert</segment><segment>review</segment><segment>by</segment><segment>application-security</segment><segment>researchers,</segment><segment>professional</segment><segment>penetration</segment><segment>testers,</segment><segment>and</segment><segment>secure</segment><segment>software</segment><segment>engineers.</segment><segment>4.8</segment><segment>Ethical</segment><segment>Considerations</segment><segment>The</segment><segment>study</segment><segment>does</segment><segment>not</segment><segment>involve</segment><segment>human</segment><segment>subjects,</segment><segment>real</segment><segment>user</segment><segment>data,</segment><segment>live-system</segment><segment>testing,</segment><segment>unauthorized</segment><segment>access,</segment><segment>exploit</segment><segment>deployment,</segment><segment>screenshots,</segment><segment>tool</segment><segment>execution,</segment><segment>or</segment><segment>private</segment><segment>vulnerability</segment><segment>findings.</segment><segment>Scenarios</segment><segment>are</segment><segment>described</segment><segment>abstractly</segment><segment>and</segment><segment>are</segment><segment>intended</segment><segment>for</segment><segment>controlled</segment><segment>educational</segment><segment>or</segment><segment>research</segment><segment>environments.</segment><segment>Any</segment><segment>future</segment><segment>implementation</segment><segment>should</segment><segment>use</segment><segment>intentionally</segment><segment>vulnerable</segment><segment>applications,</segment><segment>local</segment><segment>testbeds,</segment><segment>explicit</segment><segment>permission,</segment><segment>and</segment><segment>responsible</segment><segment>disclosure</segment><segment>principles</segment><segment>where</segment><segment>applicable.</segment><segment>Table</segment><segment>8.</segment><segment>Evaluation</segment><segment>criteria</segment><segment>for</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>and</segment><segment>AI-assisted</segment><segment>testing.</segment><segment>Criterion</segment><segment>Manual</segment><segment>testing</segment><segment>Scanner-</segment><segment>Scenario</segment><segment>recognition</segment><segment>Tester</segment><segment>identifies</segment><segment>role,</segment><segment>session,</segment><segment>object,</segment><segment>and</segment><segment>workflow</segment><segment>assisted</segment><segment>testing</segment><segment>Tool</segment><segment>must</segment><segment>discover</segment><segment>or</segment><segment>be</segment><segment>configured</segment><segment>with</segment><segment>relevant</segment><segment>state.</segment><segment>AI-assisted</segment><segment>testing</segment><segment>Model</segment><segment>must</segment><segment>infer</segment><segment>or</segment><segment>be</segment><segment>provided</segment><segment>with</segment><segment>scenario</segment><segment>state.</segment><segment>Standards-</segment><segment>based</segment><segment>review</segment><segment>Reviewer</segment><segment>checks</segment><segment>whether</segment><segment>requirement</segment><segment>coverage</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Precondition</segment><segment>handling</segment><segment>conditions.</segment><segment>Strong</segment><segment>when</segment><segment>testers</segment><segment>control</segment><segment>accounts</segment><segment>and</segment><segment>workflows.</segment><segment>Evidence</segment><segment>quality</segment><segment>Request</segment><segment>sequence,</segment><segment>account</segment><segment>roles,</segment><segment>object</segment><segment>relation,</segment><segment>and</segment><segment>response</segment><segment>evidence.</segment><segment>Human</segment><segment>judgment</segment><segment>can</segment><segment>validate</segment><segment>business</segment><segment>context.</segment><segment>Reproducibility</segment><segment>Requires</segment><segment>False-positive</segment><segment>control</segment><segment>documented</segment><segment>steps</segment><segment>and</segment><segment>accounts.</segment><segment>Often</segment><segment>limited</segment><segment>without</segment><segment>authenticated</segment><segment>crawling</segment><segment>and</segment><segment>multi-user</segment><segment>support.</segment><segment>Automated</segment><segment>traces</segment><segment>plus</segment><segment>manual</segment><segment>confirmation.</segment><segment>May</segment><segment>flag</segment><segment>request</segment><segment>differences</segment><segment>without</segment><segment>understanding</segment><segment>policy.</segment><segment>Requires</segment><segment>stable</segment><segment>crawler</segment><segment>state</segment><segment>and</segment><segment>login/session</segment><segment>handling.</segment><segment>Best</segment><segment>use</segment><segment>Deep</segment><segment>semantic</segment><segment>testing</segment><segment>and</segment><segment>business-logic</segment><segment>reasoning.</segment><segment>Broad</segment><segment>coverage</segment><segment>and</segment><segment>repeatable</segment><segment>baseline</segment><segment>scanning.</segment><segment>Variable;</segment><segment>depends</segment><segment>on</segment><segment>prompts,</segment><segment>context</segment><segment>windows,</segment><segment>and</segment><segment>tool</segment><segment>integration.</segment><segment>Explanation</segment><segment>must</segment><segment>cite</segment><segment>observed</segment><segment>evidence,</segment><segment>not</segment><segment>only</segment><segment>plausible</segment><segment>reasoning.</segment><segment>May</segment><segment>hallucinate</segment><segment>policy</segment><segment>unless</segment><segment>constrained</segment><segment>by</segment><segment>evidence.</segment><segment>Requires</segment><segment>fixed</segment><segment>prompts,</segment><segment>logs,</segment><segment>and</segment><segment>scenario</segment><segment>context.</segment><segment>Assisted</segment><segment>reasoning,</segment><segment>test</segment><segment>planning,</segment><segment>and</segment><segment>evidence</segment><segment>summarization.</segment><segment>Page</segment><segment>23</segment><segment>matches</segment><segment>scenario.</segment><segment>Strong</segment><segment>for</segment><segment>policy</segment><segment>completeness</segment><segment>but</segment><segment>not</segment><segment>a</segment><segment>runtime</segment><segment>proof.</segment><segment>Traceable</segment><segment>checklist</segment><segment>and</segment><segment>requirement</segment><segment>mapping.</segment><segment>Can</segment><segment>miss</segment><segment>runtime</segment><segment>behavior</segment><segment>if</segment><segment>review</segment><segment>is</segment><segment>document-only.</segment><segment>Requires</segment><segment>versioned</segment><segment>standards</segment><segment>and</segment><segment>mapping</segment><segment>rationale.</segment><segment>Requirements</segment><segment>traceability</segment><segment>and</segment><segment>secure-</segment><segment>development</segment><segment>governance.</segment><segment>5.</segment><segment>Results</segment><segment>and</segment><segment>Analytical</segment><segment>Outputs</segment><segment>5.1</segment><segment>Thematic</segment><segment>Findings</segment><segment>The</segment><segment>synthesis</segment><segment>produced</segment><segment>four</segment><segment>thematic</segment><segment>findings.</segment><segment>First,</segment><segment>access-control</segment><segment>failures</segment><segment>are</segment><segment>semantic</segment><segment>vulnerabilities:</segment><segment>whether</segment><segment>a</segment><segment>request</segment><segment>is</segment><segment>secure</segment><segment>depends</segment><segment>on</segment><segment>who</segment><segment>sends</segment><segment>it,</segment><segment>what</segment><segment>object</segment><segment>is</segment><segment>targeted,</segment><segment>what</segment><segment>session</segment><segment>state</segment><segment>exists,</segment><segment>and</segment><segment>what</segment><segment>workflow</segment><segment>state</segment><segment>applies.</segment><segment>Second,</segment><segment>automated</segment><segment>scanners</segment><segment>can</segment><segment>provide</segment><segment>valuable</segment><segment>coverage</segment><segment>but</segment><segment>may</segment><segment>struggle</segment><segment>with</segment><segment>multi-user</segment><segment>authorization,</segment><segment>object</segment><segment>ownership,</segment><segment>and</segment><segment>business</segment><segment>process</segment><segment>semantics</segment><segment>unless</segment><segment>state</segment><segment>and</segment><segment>credentials</segment><segment>are</segment><segment>explicitly</segment><segment>modeled.</segment><segment>Third,</segment><segment>standards</segment><segment>provide</segment><segment>strong</segment><segment>control</segment><segment>expectations,</segment><segment>but</segment><segment>additional</segment><segment>benchmark</segment><segment>documentation</segment><segment>is</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>24</segment><segment>needed</segment><segment>to</segment><segment>turn</segment><segment>those</segment><segment>expectations</segment><segment>into</segment><segment>reproducible</segment><segment>test</segment><segment>cases.</segment><segment>Fourth,</segment><segment>AI-assisted</segment><segment>testing</segment><segment>can</segment><segment>support</segment><segment>security</segment><segment>reasoning,</segment><segment>but</segment><segment>it</segment><segment>requires</segment><segment>structured</segment><segment>task</segment><segment>definitions</segment><segment>and</segment><segment>evidence</segment><segment>constraints</segment><segment>to</segment><segment>avoid</segment><segment>plausible</segment><segment>but</segment><segment>unsupported</segment><segment>conclusions.</segment><segment>5.2</segment><segment>Gap</segment><segment>Mapping</segment><segment>The</segment><segment>gap</segment><segment>mapping</segment><segment>shows</segment><segment>that</segment><segment>existing</segment><segment>resources</segment><segment>support</segment><segment>parts</segment><segment>of</segment><segment>the</segment><segment>problem</segment><segment>but</segment><segment>not</segment><segment>the</segment><segment>complete</segment><segment>stateful</segment><segment>benchmark</segment><segment>requirement.</segment><segment>OWASP</segment><segment>and</segment><segment>NIST</segment><segment>standards</segment><segment>define</segment><segment>what</segment><segment>secure</segment><segment>behavior</segment><segment>should</segment><segment>look</segment><segment>like.</segment><segment>MITRE</segment><segment>CWE</segment><segment>defines</segment><segment>weakness</segment><segment>families.</segment><segment>OWASP</segment><segment>Benchmark</segment><segment>and</segment><segment>SARD</segment><segment>provide</segment><segment>tool-evaluation</segment><segment>resources.</segment><segment>Access-control</segment><segment>research</segment><segment>proposes</segment><segment>detection</segment><segment>approaches.</segment><segment>AI-security</segment><segment>research</segment><segment>highlights</segment><segment>emerging</segment><segment>automated</segment><segment>reasoning</segment><segment>capabilities.</segment><segment>AuthStateBench</segment><segment>integrates</segment><segment>these</segment><segment>strands</segment><segment>by</segment><segment>representing</segment><segment>each</segment><segment>benchmark</segment><segment>scenario</segment><segment>as</segment><segment>a</segment><segment>stateful</segment><segment>policy</segment><segment>test</segment><segment>with</segment><segment>traceable</segment><segment>standards</segment><segment>mapping.</segment><segment>5.3</segment><segment>Framework</segment><segment>or</segment><segment>Benchmark</segment><segment>Outputs</segment><segment>The</segment><segment>primary</segment><segment>benchmark</segment><segment>outputs</segment><segment>are</segment><segment>the</segment><segment>scenario</segment><segment>taxonomy,</segment><segment>the</segment><segment>state</segment><segment>matrix,</segment><segment>the</segment><segment>standards</segment><segment>mapping,</segment><segment>and</segment><segment>the</segment><segment>scenario</segment><segment>template</segment><segment>presented</segment><segment>in</segment><segment>Tables</segment><segment>4-7.</segment><segment>These</segment><segment>outputs</segment><segment>allow</segment><segment>a</segment><segment>future</segment><segment>benchmark</segment><segment>implementation</segment><segment>to</segment><segment>include</segment><segment>representative</segment><segment>scenario</segment><segment>families</segment><segment>rather</segment><segment>than</segment><segment>isolated</segment><segment>examples.</segment><segment>For</segment><segment>instance,</segment><segment>an</segment><segment>object-level</segment><segment>authorization</segment><segment>scenario</segment><segment>can</segment><segment>be</segment><segment>instantiated</segment><segment>with</segment><segment>different</segment><segment>combinations</segment><segment>of</segment><segment>roles,</segment><segment>tenants,</segment><segment>session</segment><segment>states,</segment><segment>and</segment><segment>object-sharing</segment><segment>rules.</segment><segment>A</segment><segment>workflow</segment><segment>bypass</segment><segment>scenario</segment><segment>can</segment><segment>be</segment><segment>instantiated</segment><segment>with</segment><segment>skipped</segment><segment>approval,</segment><segment>repeated</segment><segment>confirmation,</segment><segment>forced</segment><segment>endpoint</segment><segment>access,</segment><segment>or</segment><segment>post-rollback</segment><segment>actions.</segment><segment>This</segment><segment>modular</segment><segment>design</segment><segment>supports</segment><segment>expansion</segment><segment>while</segment><segment>preserving</segment><segment>consistent</segment><segment>documentation.</segment><segment>5.4</segment><segment>Standards</segment><segment>Alignment</segment><segment>AuthStateBench</segment><segment>aligns</segment><segment>with</segment><segment>standards</segment><segment>at</segment><segment>three</segment><segment>levels.</segment><segment>At</segment><segment>the</segment><segment>risk-taxonomy</segment><segment>level,</segment><segment>it</segment><segment>maps</segment><segment>to</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025</segment><segment>and</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10:2023</segment><segment>[1]-[4].</segment><segment>At</segment><segment>the</segment><segment>verification</segment><segment>level,</segment><segment>it</segment><segment>maps</segment><segment>to</segment><segment>OWASP</segment><segment>ASVS</segment><segment>5.0.0</segment><segment>and</segment><segment>WSTG</segment><segment>testing</segment><segment>concerns</segment><segment>[5],</segment><segment>[6].</segment><segment>At</segment><segment>the</segment><segment>secure-</segment><segment>development</segment><segment>and</segment><segment>weakness-classification</segment><segment>level,</segment><segment>it</segment><segment>maps</segment><segment>to</segment><segment>NIST</segment><segment>SSDF,</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>guidance,</segment><segment>and</segment><segment>MITRE</segment><segment>CWE</segment><segment>categories</segment><segment>[8],</segment><segment>[12]-[20].</segment><segment>Identity-protocol</segment><segment>references</segment><segment>such</segment><segment>as</segment><segment>OAuth</segment><segment>2.0</segment><segment>Security</segment><segment>BCP</segment><segment>and</segment><segment>OpenID</segment><segment>Connect</segment><segment>support</segment><segment>token,</segment><segment>authentication,</segment><segment>and</segment><segment>session</segment><segment>lifecycle</segment><segment>scenarios</segment><segment>[21]-[23].</segment><segment>reviews,</segment><segment>AuthStateBench</segment><segment>adds</segment><segment>5.5</segment><segment>Comparison</segment><segment>with</segment><segment>Existing</segment><segment>Approaches</segment><segment>scenario-level</segment><segment>Compared</segment><segment>with</segment><segment>generic</segment><segment>OWASP</segment><segment>reproducibility.</segment><segment>Compared</segment><segment>with</segment><segment>scanner</segment><segment>evaluations,</segment><segment>it</segment><segment>documents</segment><segment>state</segment><segment>conditions</segment><segment>that</segment><segment>tools</segment><segment>must</segment><segment>handle</segment><segment>or</segment><segment>be</segment><segment>given.</segment><segment>Compared</segment><segment>with</segment><segment>code-level</segment><segment>vulnerability</segment><segment>datasets,</segment><segment>it</segment><segment>emphasizes</segment><segment>policy</segment><segment>semantics</segment><segment>and</segment><segment>multi-step</segment><segment>workflows.</segment><segment>Compared</segment><segment>with</segment><segment>AI-security</segment><segment>benchmarks,</segment><segment>it</segment><segment>provides</segment><segment>domain-specific</segment><segment>scenario</segment><segment>templates</segment><segment>for</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>reasoning.</segment><segment>It</segment><segment>therefore</segment><segment>does</segment><segment>not</segment><segment>replace</segment><segment>existing</segment><segment>benchmarks</segment><segment>or</segment><segment>standards;</segment><segment>it</segment><segment>complements</segment><segment>them</segment><segment>by</segment><segment>filling</segment><segment>a</segment><segment>stateful</segment><segment>scenario-design</segment><segment>gap.</segment><segment>Table</segment><segment>9.</segment><segment>Research</segment><segment>gap</segment><segment>matrix.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Existing</segment><segment>resource</segment><segment>OWASP</segment><segment>Top</segment><segment>10</segment><segment>/</segment><segment>API</segment><segment>Top</segment><segment>10</segment><segment>What</segment><segment>it</segment><segment>provides</segment><segment>Gap</segment><segment>for</segment><segment>stateful</segment><segment>Risk</segment><segment>categories</segment><segment>for</segment><segment>web</segment><segment>and</segment><segment>API</segment><segment>security.</segment><segment>authorization/authentication</segment><segment>Risk</segment><segment>category</segment><segment>does</segment><segment>not</segment><segment>by</segment><segment>itself</segment><segment>specify</segment><segment>role,</segment><segment>session,</segment><segment>object,</segment><segment>and</segment><segment>workflow</segment><segment>preconditions.</segment><segment>Requirements</segment><segment>need</segment><segment>benchmark-ready</segment><segment>scenario</segment><segment>fields</segment><segment>for</segment><segment>comparison</segment><segment>studies.</segment><segment>Guidance</segment><segment>is</segment><segment>broad</segment><segment>and</segment><segment>not</segment><segment>a</segment><segment>vulnerability</segment><segment>test-case</segment><segment>benchmark.</segment><segment>CWE</segment><segment>IDs</segment><segment>alone</segment><segment>do</segment><segment>not</segment><segment>define</segment><segment>multi-user</segment><segment>workflow</segment><segment>conditions.</segment><segment>Less</segment><segment>focused</segment><segment>on</segment><segment>multi-step</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>semantics.</segment><segment>May</segment><segment>not</segment><segment>isolate</segment><segment>authorization</segment><segment>workflow</segment><segment>reasoning</segment><segment>from</segment><segment>exploit</segment><segment>execution.</segment><segment>Page</segment><segment>25</segment><segment>AuthStateBench</segment><segment>response</segment><segment>Converts</segment><segment>risk</segment><segment>categories</segment><segment>into</segment><segment>scenario</segment><segment>classes.</segment><segment>Maps</segment><segment>scenarios</segment><segment>to</segment><segment>requirements</segment><segment>and</segment><segment>evidence</segment><segment>expectations.</segment><segment>Links</segment><segment>benchmark</segment><segment>scenarios</segment><segment>to</segment><segment>secure-</segment><segment>development</segment><segment>and</segment><segment>validation</segment><segment>activities.</segment><segment>Uses</segment><segment>CWE</segment><segment>as</segment><segment>traceability,</segment><segment>not</segment><segment>as</segment><segment>the</segment><segment>entire</segment><segment>scenario</segment><segment>definition.</segment><segment>Adds</segment><segment>stateful</segment><segment>scenario</segment><segment>design</segment><segment>for</segment><segment>auth/access-control</segment><segment>cases.</segment><segment>Defines</segment><segment>structured</segment><segment>tasks</segment><segment>for</segment><segment>future</segment><segment>AI-</segment><segment>assisted</segment><segment>testing</segment><segment>comparison.</segment><segment>OWASP</segment><segment>ASVS</segment><segment>/</segment><segment>WSTG</segment><segment>Verification</segment><segment>and</segment><segment>testing</segment><segment>guidance.</segment><segment>NIST</segment><segment>SSDF</segment><segment>/</segment><segment>CISA</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>MITRE</segment><segment>CWE</segment><segment>Secure-</segment><segment>development</segment><segment>governance</segment><segment>and</segment><segment>product-security</segment><segment>principles.</segment><segment>Weakness</segment><segment>family</segment><segment>taxonomy.</segment><segment>OWASP</segment><segment>Benchmark</segment><segment>/</segment><segment>SARD</segment><segment>/</segment><segment>Juliet</segment><segment>Repeatable</segment><segment>test</segment><segment>cases</segment><segment>for</segment><segment>tool</segment><segment>evaluation.</segment><segment>AI</segment><segment>vulnerability</segment><segment>benchmarks</segment><segment>Evaluate</segment><segment>AI</segment><segment>or</segment><segment>agentic</segment><segment>security</segment><segment>capabilities.</segment><segment>Table</segment><segment>10.</segment><segment>Future</segment><segment>validation</segment><segment>and</segment><segment>research</segment><segment>roadmap.</segment><segment>Stage</segment><segment>Purpose</segment><segment>Stage</segment><segment>1:</segment><segment>standards</segment><segment>alignment</segment><segment>review</segment><segment>Check</segment><segment>whether</segment><segment>mappings</segment><segment>are</segment><segment>accurate</segment><segment>and</segment><segment>complete.</segment><segment>Stage</segment><segment>2:</segment><segment>expert</segment><segment>Assess</segment><segment>practical</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>Recommended</segment><segment>activity</segment><segment>Compare</segment><segment>each</segment><segment>scenario</segment><segment>class</segment><segment>with</segment><segment>OWASP,</segment><segment>ASVS,</segment><segment>WSTG,</segment><segment>NIST,</segment><segment>CISA,</segment><segment>MITRE,</segment><segment>OAuth,</segment><segment>and</segment><segment>OpenID</segment><segment>sources.</segment><segment>Invite</segment><segment>3-5</segment><segment>Expected</segment><segment>output</segment><segment>Validated</segment><segment>mapping</segment><segment>table</segment><segment>and</segment><segment>revised</segment><segment>scenario</segment><segment>definitions.</segment><segment>Expert</segment><segment>feedback</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>26</segment><segment>matrix</segment><segment>and</segment><segment>updated</segment><segment>taxonomy.</segment><segment>Runnable</segment><segment>benchmark</segment><segment>prototype</segment><segment>and</segment><segment>ground-truth</segment><segment>labels.</segment><segment>Comparative</segment><segment>evaluation</segment><segment>results</segment><segment>with</segment><segment>transparent</segment><segment>limitations.</segment><segment>Versioned</segment><segment>public</segment><segment>benchmark</segment><segment>artifact.</segment><segment>review</segment><segment>realism</segment><segment>and</segment><segment>clarity.</segment><segment>Turn</segment><segment>abstract</segment><segment>scenarios</segment><segment>into</segment><segment>local</segment><segment>vulnerable</segment><segment>applications.</segment><segment>Evaluate</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>AI-</segment><segment>assisted,</segment><segment>and</segment><segment>standards-based</segment><segment>approaches.</segment><segment>Enable</segment><segment>reuse</segment><segment>and</segment><segment>replication.</segment><segment>Stage</segment><segment>3:</segment><segment>controlled</segment><segment>implementation</segment><segment>Stage</segment><segment>4:</segment><segment>method</segment><segment>comparison</segment><segment>Stage</segment><segment>5:</segment><segment>public</segment><segment>release</segment><segment>6.</segment><segment>Discussion</segment><segment>application-security</segment><segment>academics,</segment><segment>penetration</segment><segment>testers,</segment><segment>or</segment><segment>secure</segment><segment>software</segment><segment>engineers.</segment><segment>Implement</segment><segment>representative</segment><segment>scenarios</segment><segment>in</segment><segment>a</segment><segment>testbed</segment><segment>with</segment><segment>documented</segment><segment>accounts</segment><segment>and</segment><segment>workflows.</segment><segment>Run</segment><segment>controlled</segment><segment>tests</segment><segment>without</segment><segment>live</segment><segment>targets</segment><segment>and</segment><segment>record</segment><segment>evidence</segment><segment>quality.</segment><segment>Publish</segment><segment>documentation,</segment><segment>templates,</segment><segment>scenario</segment><segment>definitions,</segment><segment>and</segment><segment>implementation</segment><segment>notes.</segment><segment>6.1</segment><segment>Key</segment><segment>Insights</segment><segment>The</segment><segment>first</segment><segment>key</segment><segment>insight</segment><segment>is</segment><segment>that</segment><segment>stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>testing</segment><segment>must</segment><segment>be</segment><segment>framed</segment><segment>as</segment><segment>policy-state</segment><segment>verification</segment><segment>rather</segment><segment>than</segment><segment>payload</segment><segment>detection.</segment><segment>A</segment><segment>payload-centered</segment><segment>view</segment><segment>is</segment><segment>useful</segment><segment>for</segment><segment>injection</segment><segment>and</segment><segment>many</segment><segment>input-driven</segment><segment>flaws,</segment><segment>but</segment><segment>it</segment><segment>is</segment><segment>insufficient</segment><segment>for</segment><segment>understanding</segment><segment>whether</segment><segment>an</segment><segment>authenticated</segment><segment>user</segment><segment>should</segment><segment>access</segment><segment>a</segment><segment>resource,</segment><segment>whether</segment><segment>a</segment><segment>tenant</segment><segment>boundary</segment><segment>should</segment><segment>apply,</segment><segment>or</segment><segment>whether</segment><segment>a</segment><segment>workflow</segment><segment>state</segment><segment>authorizes</segment><segment>an</segment><segment>operation.</segment><segment>The</segment><segment>second</segment><segment>insight</segment><segment>is</segment><segment>that</segment><segment>standards</segment><segment>mapping</segment><segment>improves</segment><segment>benchmark</segment><segment>legitimacy,</segment><segment>but</segment><segment>standards</segment><segment>alone</segment><segment>do</segment><segment>not</segment><segment>create</segment><segment>benchmark</segment><segment>reproducibility.</segment><segment>The</segment><segment>third</segment><segment>insight</segment><segment>is</segment><segment>that</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>and</segment><segment>AI-assisted</segment><segment>approaches</segment><segment>should</segment><segment>not</segment><segment>be</segment><segment>treated</segment><segment>as</segment><segment>interchangeable.</segment><segment>Each</segment><segment>has</segment><segment>different</segment><segment>strengths</segment><segment>and</segment><segment>evidence</segment><segment>requirements.</segment><segment>6.2</segment><segment>Cybersecurity</segment><segment>Implications</segment><segment>AuthStateBench</segment><segment>has</segment><segment>implications</segment><segment>for</segment><segment>application-security</segment><segment>research</segment><segment>and</segment><segment>cyber</segment><segment>defense.</segment><segment>For</segment><segment>researchers,</segment><segment>it</segment><segment>provides</segment><segment>a</segment><segment>way</segment><segment>to</segment><segment>define</segment><segment>comparable</segment><segment>tasks</segment><segment>for</segment><segment>access-control</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>testing.</segment><segment>For</segment><segment>tool</segment><segment>builders,</segment><segment>it</segment><segment>clarifies</segment><segment>what</segment><segment>state</segment><segment>information</segment><segment>a</segment><segment>scanner</segment><segment>or</segment><segment>AI-assisted</segment><segment>system</segment><segment>must</segment><segment>handle.</segment><segment>For</segment><segment>defenders,</segment><segment>it</segment><segment>encourages</segment><segment>evidence-based</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>27</segment><segment>assessment</segment><segment>of</segment><segment>whether</segment><segment>authorization</segment><segment>and</segment><segment>session</segment><segment>controls</segment><segment>enforce</segment><segment>server-side</segment><segment>policy</segment><segment>across</segment><segment>realistic</segment><segment>business</segment><segment>states.</segment><segment>For</segment><segment>educators,</segment><segment>it</segment><segment>offers</segment><segment>a</segment><segment>structured</segment><segment>way</segment><segment>to</segment><segment>teach</segment><segment>junior</segment><segment>penetration</segment><segment>testers</segment><segment>why</segment><segment>authentication,</segment><segment>authorization,</segment><segment>session</segment><segment>management,</segment><segment>and</segment><segment>workflow</segment><segment>logic</segment><segment>must</segment><segment>be</segment><segment>tested</segment><segment>together.</segment><segment>6.3</segment><segment>Practical</segment><segment>and</segment><segment>Policy</segment><segment>Implications</segment><segment>In</segment><segment>practice,</segment><segment>the</segment><segment>benchmark</segment><segment>design</segment><segment>can</segment><segment>support</segment><segment>secure</segment><segment>development</segment><segment>lifecycle</segment><segment>activities.</segment><segment>Requirements</segment><segment>engineers</segment><segment>can</segment><segment>use</segment><segment>the</segment><segment>state</segment><segment>matrix</segment><segment>to</segment><segment>document</segment><segment>authorization</segment><segment>rules.</segment><segment>Developers</segment><segment>can</segment><segment>use</segment><segment>scenario</segment><segment>templates</segment><segment>to</segment><segment>write</segment><segment>tests</segment><segment>for</segment><segment>object</segment><segment>ownership</segment><segment>and</segment><segment>workflow</segment><segment>preconditions.</segment><segment>Penetration</segment><segment>testers</segment><segment>can</segment><segment>use</segment><segment>the</segment><segment>taxonomy</segment><segment>to</segment><segment>structure</segment><segment>manual</segment><segment>testing</segment><segment>evidence.</segment><segment>Security</segment><segment>managers</segment><segment>can</segment><segment>map</segment><segment>findings</segment><segment>to</segment><segment>standards</segment><segment>for</segment><segment>reporting</segment><segment>and</segment><segment>remediation</segment><segment>prioritization.</segment><segment>Policy</segment><segment>teams</segment><segment>can</segment><segment>use</segment><segment>the</segment><segment>structure</segment><segment>to</segment><segment>connect</segment><segment>secure-by-design</segment><segment>expectations</segment><segment>with</segment><segment>concrete</segment><segment>verification</segment><segment>evidence.</segment><segment>6.4</segment><segment>Limitations</segment><segment>The</segment><segment>article</segment><segment>has</segment><segment>clear</segment><segment>limitations.</segment><segment>AuthStateBench</segment><segment>is</segment><segment>a</segment><segment>design</segment><segment>artifact,</segment><segment>not</segment><segment>a</segment><segment>completed</segment><segment>empirical</segment><segment>benchmark</segment><segment>implementation.</segment><segment>No</segment><segment>tool</segment><segment>results</segment><segment>are</segment><segment>reported,</segment><segment>and</segment><segment>no</segment><segment>claim</segment><segment>is</segment><segment>made</segment><segment>about</segment><segment>detection</segment><segment>accuracy.</segment><segment>The</segment><segment>taxonomy</segment><segment>may</segment><segment>require</segment><segment>refinement</segment><segment>after</segment><segment>expert</segment><segment>review</segment><segment>and</segment><segment>controlled</segment><segment>implementation.</segment><segment>Some</segment><segment>standards</segment><segment>references</segment><segment>may</segment><segment>evolve,</segment><segment>so</segment><segment>mappings</segment><segment>should</segment><segment>be</segment><segment>versioned.</segment><segment>The</segment><segment>current</segment><segment>design</segment><segment>focuses</segment><segment>on</segment><segment>web</segment><segment>applications</segment><segment>and</segment><segment>APIs</segment><segment>and</segment><segment>may</segment><segment>not</segment><segment>directly</segment><segment>apply</segment><segment>to</segment><segment>mobile,</segment><segment>IoT,</segment><segment>blockchain,</segment><segment>or</segment><segment>low-level</segment><segment>protocol</segment><segment>systems</segment><segment>without</segment><segment>adaptation.</segment><segment>6.5</segment><segment>Future</segment><segment>Research</segment><segment>Roadmap</segment><segment>Future</segment><segment>work</segment><segment>should</segment><segment>proceed</segment><segment>in</segment><segment>five</segment><segment>steps.</segment><segment>First,</segment><segment>an</segment><segment>independent</segment><segment>standards-alignment</segment><segment>review</segment><segment>should</segment><segment>verify</segment><segment>scenario</segment><segment>mappings.</segment><segment>Second,</segment><segment>expert</segment><segment>review</segment><segment>should</segment><segment>assess</segment><segment>practical</segment><segment>realism</segment><segment>and</segment><segment>coverage.</segment><segment>Third,</segment><segment>selected</segment><segment>scenarios</segment><segment>should</segment><segment>be</segment><segment>implemented</segment><segment>in</segment><segment>controlled</segment><segment>vulnerable</segment><segment>web</segment><segment>applications</segment><segment>with</segment><segment>versioned</segment><segment>documentation.</segment><segment>Fourth,</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>AI-assisted,</segment><segment>and</segment><segment>standards-based</segment><segment>methods</segment><segment>should</segment><segment>be</segment><segment>compared</segment><segment>using</segment><segment>explicit</segment><segment>evidence</segment><segment>criteria.</segment><segment>Fifth,</segment><segment>the</segment><segment>benchmark</segment><segment>should</segment><segment>be</segment><segment>released</segment><segment>as</segment><segment>a</segment><segment>public</segment><segment>artifact</segment><segment>with</segment><segment>scenario</segment><segment>definitions,</segment><segment>implementation</segment><segment>notes,</segment><segment>ground-truth</segment><segment>labels,</segment><segment>and</segment><segment>clear</segment><segment>ethical-use</segment><segment>guidance.</segment><segment>Fig.</segment><segment>5</segment><segment>converts</segment><segment>the</segment><segment>future-work</segment><segment>discussion</segment><segment>into</segment><segment>a</segment><segment>validation</segment><segment>roadmap.</segment><segment>This</segment><segment>separation</segment><segment>between</segment><segment>design</segment><segment>and</segment><segment>empirical</segment><segment>validation</segment><segment>is</segment><segment>important</segment><segment>because</segment><segment>the</segment><segment>current</segment><segment>article</segment><segment>does</segment><segment>not</segment><segment>claim</segment><segment>scanner</segment><segment>accuracy</segment><segment>or</segment><segment>AI-agent</segment><segment>performance.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>28</segment><segment>Fig.</segment><segment>5.</segment><segment>Future</segment><segment>validation</segment><segment>roadmap</segment><segment>for</segment><segment>turning</segment><segment>AuthStateBench</segment><segment>into</segment><segment>an</segment><segment>empirical</segment><segment>benchmark.</segment><segment>7.</segment><segment>Conclusion</segment><segment>Stateful</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>weaknesses</segment><segment>remain</segment><segment>difficult</segment><segment>to</segment><segment>benchmark</segment><segment>because</segment><segment>their</segment><segment>security</segment><segment>depends</segment><segment>on</segment><segment>role,</segment><segment>session,</segment><segment>object</segment><segment>ownership,</segment><segment>and</segment><segment>workflow</segment><segment>conditions.</segment><segment>Existing</segment><segment>standards</segment><segment>and</segment><segment>benchmarks</segment><segment>provide</segment><segment>valuable</segment><segment>foundations,</segment><segment>but</segment><segment>they</segment><segment>do</segment><segment>not</segment><segment>fully</segment><segment>solve</segment><segment>the</segment><segment>problem</segment><segment>of</segment><segment>scenario-level</segment><segment>reproducibility</segment><segment>for</segment><segment>semantic</segment><segment>access-control</segment><segment>and</segment><segment>authentication</segment><segment>failures.</segment><segment>AuthStateBench</segment><segment>addresses</segment><segment>this</segment><segment>gap</segment><segment>by</segment><segment>proposing</segment><segment>a</segment><segment>standards-aligned</segment><segment>benchmark</segment><segment>design</segment><segment>that</segment><segment>includes</segment><segment>a</segment><segment>four-dimensional</segment><segment>state</segment><segment>model,</segment><segment>scenario</segment><segment>taxonomy,</segment><segment>standards</segment><segment>mapping,</segment><segment>scenario</segment><segment>template,</segment><segment>evaluation</segment><segment>criteria,</segment><segment>and</segment><segment>validation</segment><segment>roadmap.</segment><segment>The</segment><segment>article</segment><segment>deliberately</segment><segment>avoids</segment><segment>unsupported</segment><segment>empirical</segment><segment>claims.</segment><segment>It</segment><segment>does</segment><segment>not</segment><segment>report</segment><segment>scanner</segment><segment>results,</segment><segment>AI-agent</segment><segment>performance,</segment><segment>exploit</segment><segment>success,</segment><segment>or</segment><segment>real-system</segment><segment>testing.</segment><segment>Its</segment><segment>contribution</segment><segment>is</segment><segment>a</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>29</segment><segment>design</segment><segment>framework</segment><segment>that</segment><segment>future</segment><segment>researchers</segment><segment>and</segment><segment>practitioners</segment><segment>can</segment><segment>implement</segment><segment>and</segment><segment>evaluate</segment><segment>transparently.</segment><segment>By</segment><segment>making</segment><segment>stateful</segment><segment>conditions</segment><segment>explicit,</segment><segment>AuthStateBench</segment><segment>can</segment><segment>improve</segment><segment>comparability</segment><segment>in</segment><segment>web</segment><segment>security</segment><segment>testing,</segment><segment>support</segment><segment>secure-development</segment><segment>education,</segment><segment>and</segment><segment>provide</segment><segment>a</segment><segment>foundation</segment><segment>for</segment><segment>more</segment><segment>rigorous</segment><segment>evaluation</segment><segment>of</segment><segment>manual,</segment><segment>scanner-assisted,</segment><segment>AI-assisted,</segment><segment>and</segment><segment>standards-based</segment><segment>approaches</segment><segment>to</segment><segment>authorization</segment><segment>and</segment><segment>authentication</segment><segment>workflow</segment><segment>security.</segment><segment>Declarations</segment><segment>Funding</segment><segment>No</segment><segment>funding</segment><segment>was</segment><segment>received</segment><segment>for</segment><segment>this</segment><segment>work.</segment><segment>Competing</segment><segment>Interests</segment><segment>The</segment><segment>author</segment><segment>declares</segment><segment>no</segment><segment>competing</segment><segment>interests.</segment><segment>Ethics</segment><segment>Approval</segment><segment>Not</segment><segment>applicable.</segment><segment>This</segment><segment>article</segment><segment>is</segment><segment>a</segment><segment>literature-based</segment><segment>and</segment><segment>standards-aligned</segment><segment>benchmark-design</segment><segment>study</segment><segment>and</segment><segment>does</segment><segment>not</segment><segment>involve</segment><segment>human</segment><segment>participants,</segment><segment>personal</segment><segment>data,</segment><segment>live-system</segment><segment>testing,</segment><segment>or</segment><segment>animal</segment><segment>subjects.</segment><segment>Consent</segment><segment>for</segment><segment>Publication</segment><segment>Not</segment><segment>applicable.</segment><segment>Data</segment><segment>Availability</segment><segment>No</segment><segment>empirical</segment><segment>dataset</segment><segment>was</segment><segment>generated</segment><segment>or</segment><segment>analyzed.</segment><segment>The</segment><segment>article</segment><segment>is</segment><segment>based</segment><segment>on</segment><segment>publicly</segment><segment>available</segment><segment>literature,</segment><segment>standards,</segment><segment>and</segment><segment>guidance</segment><segment>sources</segment><segment>cited</segment><segment>in</segment><segment>the</segment><segment>reference</segment><segment>list.</segment><segment>Future</segment><segment>benchmark</segment><segment>scenarios</segment><segment>should</segment><segment>be</segment><segment>released</segment><segment>as</segment><segment>versioned</segment><segment>documentation</segment><segment>if</segment><segment>implemented.</segment><segment>Author</segment><segment>Contributions</segment><segment>Muhammad</segment><segment>Shahzad</segment><segment>Khadim</segment><segment>conceptualized</segment><segment>the</segment><segment>study,</segment><segment>designed</segment><segment>the</segment><segment>methodology,</segment><segment>developed</segment><segment>the</segment><segment>benchmark</segment><segment>model,</segment><segment>and</segment><segment>wrote</segment><segment>the</segment><segment>manuscript.</segment><segment>Syed</segment><segment>Mufassir</segment><segment>Shah</segment><segment>contributed</segment><segment>to</segment><segment>literature</segment><segment>review,</segment><segment>data</segment><segment>organization,</segment><segment>and</segment><segment>manuscript</segment><segment>editing.</segment><segment>Zubair</segment><segment>Khan</segment><segment>assisted</segment><segment>in</segment><segment>validation</segment><segment>design,</segment><segment>formatting,</segment><segment>and</segment><segment>final</segment><segment>proofreading.</segment><segment>Acknowledgements</segment><segment>The</segment><segment>author</segment><segment>acknowledges</segment><segment>the</segment><segment>public</segment><segment>work</segment><segment>of</segment><segment>OWASP,</segment><segment>NIST,</segment><segment>MITRE,</segment><segment>CISA,</segment><segment>FIRST,</segment><segment>IETF,</segment><segment>OpenID</segment><segment>Foundation,</segment><segment>and</segment><segment>the</segment><segment>academic</segment><segment>security</segment><segment>research</segment><segment>community</segment><segment>whose</segment><segment>standards</segment><segment>and</segment><segment>studies</segment><segment>informed</segment><segment>this</segment><segment>conceptual</segment><segment>benchmark</segment><segment>design.</segment><segment>Declaration</segment><segment>of</segment><segment>generative</segment><segment>AI</segment><segment>and</segment><segment>AI-assisted</segment><segment>technologies</segment><segment>in</segment><segment>the</segment><segment>manuscript</segment><segment>preparation</segment><segment>process</segment><segment>During</segment><segment>the</segment><segment>preparation</segment><segment>of</segment><segment>this</segment><segment>work,</segment><segment>the</segment><segment>author</segment><segment>used</segment><segment>ChatGPT</segment><segment>by</segment><segment>OpenAI</segment><segment>to</segment><segment>assist</segment><segment>with</segment><segment>improvement,</segment><segment>clarity</segment><segment>enhancement,</segment><segment>and</segment><segment>manuscript</segment><segment>language</segment><segment>refinement,</segment><segment>formatting</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>30</segment><segment>organization.</segment><segment>After</segment><segment>using</segment><segment>this</segment><segment>tool,</segment><segment>the</segment><segment>author</segment><segment>reviewed</segment><segment>and</segment><segment>edited</segment><segment>the</segment><segment>content</segment><segment>as</segment><segment>needed</segment><segment>and</segment><segment>takes</segment><segment>full</segment><segment>responsibility</segment><segment>for</segment><segment>the</segment><segment>content</segment><segment>of</segment><segment>the</segment><segment>submitted</segment><segment>manuscript.</segment><segment>References</segment><segment>[1]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>OWASP</segment><segment>Top</segment><segment>Ten</segment><segment>Web</segment><segment>Application</segment><segment>Security</segment><segment>Risks</segment><segment>2025.</segment><segment>OWASP,</segment><segment>2025.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[2]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>A01:2025</segment><segment>-</segment><segment>Broken</segment><segment>Access</segment><segment>Control.</segment><segment>OWASP</segment><segment>Top</segment><segment>10:2025.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[3]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10</segment><segment>2023.</segment><segment>OWASP,</segment><segment>2023.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[4]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>API1:2023</segment><segment>-</segment><segment>Broken</segment><segment>Object</segment><segment>Level</segment><segment>Authorization.</segment><segment>OWASP</segment><segment>API</segment><segment>Security</segment><segment>Top</segment><segment>10</segment><segment>2023.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[5]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>OWASP</segment><segment>Application</segment><segment>Security</segment><segment>Verification</segment><segment>Standard</segment><segment>5.0.0.</segment><segment>OWASP,</segment><segment>2025.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[6]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>OWASP</segment><segment>Web</segment><segment>Security</segment><segment>Testing</segment><segment>Guide,</segment><segment>latest</segment><segment>release.</segment><segment>OWASP.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[7]</segment><segment>OWASP</segment><segment>Foundation.</segment><segment>OWASP</segment><segment>Benchmark</segment><segment>Project.</segment><segment>OWASP.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[8]</segment><segment>M.</segment><segment>Souppaya,</segment><segment>K.</segment><segment>Scarfone,</segment><segment>and</segment><segment>D.</segment><segment>Dodson.</segment><segment>Secure</segment><segment>Software</segment><segment>Development</segment><segment>Framework</segment><segment>(SSDF)</segment><segment>Version</segment><segment>1.1:</segment><segment>Recommendations</segment><segment>for</segment><segment>Mitigating</segment><segment>the</segment><segment>Risk</segment><segment>of</segment><segment>Software</segment><segment>Vulnerabilities.</segment><segment>NIST</segment><segment>SP</segment><segment>800-218,</segment><segment>2022.</segment><segment>[9]</segment><segment>NIST</segment><segment>SAMATE.</segment><segment>Software</segment><segment>Assurance</segment><segment>Reference</segment><segment>Dataset</segment><segment>(SARD).</segment><segment>National</segment><segment>Institute</segment><segment>of</segment><segment>Standards</segment><segment>and</segment><segment>Technology.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[10]</segment><segment>P.</segment><segment>E.</segment><segment>Black.</segment><segment>The</segment><segment>Software</segment><segment>Assurance</segment><segment>Reference</segment><segment>Dataset.</segment><segment>NIST</segment><segment>Internal</segment><segment>Report</segment><segment>8561,</segment><segment>2025.</segment><segment>[11]</segment><segment>F.</segment><segment>E.</segment><segment>Boland</segment><segment>Jr.</segment><segment>and</segment><segment>P.</segment><segment>E.</segment><segment>Black.</segment><segment>The</segment><segment>Juliet</segment><segment>1.1</segment><segment>C/C++</segment><segment>and</segment><segment>Java</segment><segment>Test</segment><segment>Suite.</segment><segment>National</segment><segment>Institute</segment><segment>of</segment><segment>Standards</segment><segment>and</segment><segment>Technology,</segment><segment>2012.</segment><segment>[12]</segment><segment>MITRE.</segment><segment>CWE-284:</segment><segment>Improper</segment><segment>Access</segment><segment>Control.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[13]</segment><segment>MITRE.</segment><segment>CWE-287:</segment><segment>Improper</segment><segment>Authentication.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[14]</segment><segment>MITRE.</segment><segment>CWE-306:</segment><segment>Missing</segment><segment>Authentication</segment><segment>for</segment><segment>Critical</segment><segment>Function.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[15]</segment><segment>MITRE.</segment><segment>CWE-613:</segment><segment>Insufficient</segment><segment>Session</segment><segment>Expiration.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[16]</segment><segment>MITRE.</segment><segment>CWE-639:</segment><segment>Authorization</segment><segment>Bypass</segment><segment>Through</segment><segment>User-Controlled</segment><segment>Key.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>31</segment><segment>[17]</segment><segment>MITRE.</segment><segment>CWE-862:</segment><segment>Missing</segment><segment>Authorization.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[18]</segment><segment>MITRE.</segment><segment>CWE-863:</segment><segment>Incorrect</segment><segment>Authorization.</segment><segment>Common</segment><segment>Weakness</segment><segment>Enumeration.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[19]</segment><segment>CISA.</segment><segment>Secure</segment><segment>by</segment><segment>Design.</segment><segment>Cybersecurity</segment><segment>and</segment><segment>Infrastructure</segment><segment>Security</segment><segment>Agency.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[20]</segment><segment>CISA</segment><segment>and</segment><segment>international</segment><segment>partners.</segment><segment>Shifting</segment><segment>the</segment><segment>Balance</segment><segment>of</segment><segment>Cybersecurity</segment><segment>Risk:</segment><segment>Principles</segment><segment>and</segment><segment>Approaches</segment><segment>for</segment><segment>Secure</segment><segment>by</segment><segment>Design</segment><segment>Software,</segment><segment>2023.</segment><segment>[21]</segment><segment>T.</segment><segment>Lodderstedt,</segment><segment>J.</segment><segment>Bradley,</segment><segment>A.</segment><segment>Labunets,</segment><segment>and</segment><segment>D.</segment><segment>Fett.</segment><segment>Best</segment><segment>Current</segment><segment>Practice</segment><segment>for</segment><segment>OAuth</segment><segment>2.0</segment><segment>Security.</segment><segment>RFC</segment><segment>9700,</segment><segment>BCP</segment><segment>240,</segment><segment>RFC</segment><segment>Editor,</segment><segment>2025.</segment><segment>doi:10.17487/RFC9700.</segment><segment>[22]</segment><segment>N.</segment><segment>Sakimura,</segment><segment>J.</segment><segment>Bradley,</segment><segment>M.</segment><segment>Jones,</segment><segment>B.</segment><segment>de</segment><segment>Medeiros,</segment><segment>and</segment><segment>C.</segment><segment>Mortimore.</segment><segment>OpenID</segment><segment>Connect</segment><segment>Core</segment><segment>1.0</segment><segment>incorporating</segment><segment>errata</segment><segment>set</segment><segment>2.</segment><segment>OpenID</segment><segment>Foundation.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[23]</segment><segment>OpenID</segment><segment>Foundation.</segment><segment>OpenID</segment><segment>Connect</segment><segment>Session</segment><segment>Management</segment><segment>1.0.</segment><segment>Final</segment><segment>specification,</segment><segment>2022.</segment><segment>[24]</segment><segment>FIRST.</segment><segment>Common</segment><segment>Vulnerability</segment><segment>Scoring</segment><segment>System</segment><segment>Version</segment><segment>4.0:</segment><segment>Specification</segment><segment>Document.</segment><segment>Forum</segment><segment>of</segment><segment>Incident</segment><segment>Response</segment><segment>and</segment><segment>Security</segment><segment>Teams.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[25]</segment><segment>FIRST.</segment><segment>Exploit</segment><segment>Prediction</segment><segment>Scoring</segment><segment>System</segment><segment>(EPSS).</segment><segment>Forum</segment><segment>of</segment><segment>Incident</segment><segment>Response</segment><segment>and</segment><segment>Security</segment><segment>Teams.</segment><segment>Accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>[26]</segment><segment>M.</segment><segment>Rennhard,</segment><segment>et</segment><segment>al.</segment><segment>Automating</segment><segment>the</segment><segment>Detection</segment><segment>of</segment><segment>Access</segment><segment>Control</segment><segment>Vulnerabilities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>SN</segment><segment>Computer</segment><segment>Science,</segment><segment>2022.</segment><segment>[27]</segment><segment>L.</segment><segment>Zhong,</segment><segment>et</segment><segment>al.</segment><segment>A</segment><segment>Survey</segment><segment>of</segment><segment>Prevent</segment><segment>and</segment><segment>Detect</segment><segment>Access</segment><segment>Control</segment><segment>Vulnerabilities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>arXiv</segment><segment>preprint</segment><segment>arXiv:2304.10600,</segment><segment>2023.</segment><segment>[28]</segment><segment>F.</segment><segment>Liu,</segment><segment>et</segment><segment>al.</segment><segment>BACScan:</segment><segment>Automatic</segment><segment>Black-Box</segment><segment>Detection</segment><segment>of</segment><segment>Broken</segment><segment>Access-Control</segment><segment>Vulnerabilities.</segment><segment>ACM</segment><segment>CCS,</segment><segment>2025.</segment><segment>[29]</segment><segment>F.</segment><segment>Sun,</segment><segment>L.</segment><segment>Xu,</segment><segment>and</segment><segment>Z.</segment><segment>Su.</segment><segment>Static</segment><segment>Detection</segment><segment>of</segment><segment>Access</segment><segment>Control</segment><segment>Vulnerabilities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>USENIX</segment><segment>Security</segment><segment>Symposium,</segment><segment>2011.</segment><segment>[30]</segment><segment>X.</segment><segment>Li</segment><segment>and</segment><segment>Y.</segment><segment>Xue.</segment><segment>BLOCK:</segment><segment>A</segment><segment>Black-box</segment><segment>Approach</segment><segment>for</segment><segment>Detection</segment><segment>of</segment><segment>State</segment><segment>Violation</segment><segment>Attacks</segment><segment>Towards</segment><segment>Web</segment><segment>Applications.</segment><segment>ACSAC,</segment><segment>2011.</segment><segment>[31]</segment><segment>V.</segment><segment>Felmetsger,</segment><segment>L.</segment><segment>Cavedon,</segment><segment>C.</segment><segment>Kruegel,</segment><segment>and</segment><segment>G.</segment><segment>Vigna.</segment><segment>Toward</segment><segment>Automated</segment><segment>Detection</segment><segment>of</segment><segment>Logic</segment><segment>Vulnerabilities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>USENIX</segment><segment>Security</segment><segment>Symposium,</segment><segment>2010.</segment><segment>[32]</segment><segment>G.</segment><segment>Pellegrino</segment><segment>and</segment><segment>D.</segment><segment>Balzarotti.</segment><segment>Toward</segment><segment>Black-Box</segment><segment>Detection</segment><segment>of</segment><segment>Logic</segment><segment>Flaws</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>Network</segment><segment>and</segment><segment>Distributed</segment><segment>System</segment><segment>Security</segment><segment>Symposium,</segment><segment>2014.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>32</segment><segment>[33]</segment><segment>P.</segment><segment>P.</segment><segment>S.</segment><segment>Bisht,</segment><segment>T.</segment><segment>Hinrichs,</segment><segment>N.</segment><segment>Skrupsky,</segment><segment>R.</segment><segment>Bobrowicz,</segment><segment>and</segment><segment>V.</segment><segment>N.</segment><segment>Venkatakrishnan.</segment><segment>NoTamper:</segment><segment>Automatic</segment><segment>Blackbox</segment><segment>Detection</segment><segment>of</segment><segment>Parameter</segment><segment>Tampering</segment><segment>Opportunities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>ACM</segment><segment>CCS,</segment><segment>2010.</segment><segment>[34]</segment><segment>X.</segment><segment>Li,</segment><segment>Y.</segment><segment>Xue,</segment><segment>and</segment><segment>M.</segment><segment>Chu.</segment><segment>Automated</segment><segment>Black-Box</segment><segment>Detection</segment><segment>of</segment><segment>Access</segment><segment>Control</segment><segment>Vulnerabilities</segment><segment>in</segment><segment>Web</segment><segment>Applications.</segment><segment>SACMAT,</segment><segment>2014.</segment><segment>[35]</segment><segment>A.</segment><segment>Borcherding,</segment><segment>et</segment><segment>al.</segment><segment>SWaTEval:</segment><segment>An</segment><segment>Evaluation</segment><segment>Framework</segment><segment>for</segment><segment>Stateful</segment><segment>Web</segment><segment>Application</segment><segment>Testing.</segment><segment>Information</segment><segment>Systems</segment><segment>and</segment><segment>Technologies,</segment><segment>2023.</segment><segment>International</segment><segment>Conference</segment><segment>on</segment><segment>Web</segment><segment>[36]</segment><segment>R.</segment><segment>Natella,</segment><segment>et</segment><segment>al.</segment><segment>ProFuzzBench:</segment><segment>A</segment><segment>Benchmark</segment><segment>for</segment><segment>Stateful</segment><segment>Protocol</segment><segment>Fuzzing.</segment><segment>ACM</segment><segment>ISSTA,</segment><segment>2021.</segment><segment>[37]</segment><segment>E.</segment><segment>Fong,</segment><segment>V.</segment><segment>Okun,</segment><segment>and</segment><segment>R.</segment><segment>Gaucher.</segment><segment>Web</segment><segment>Application</segment><segment>Scanners:</segment><segment>Definitions</segment><segment>and</segment><segment>Functions.</segment><segment>NIST</segment><segment>SAMATE,</segment><segment>2007.</segment><segment>[38]</segment><segment>P.</segment><segment>Nunes,</segment><segment>J.</segment><segment>Fonseca,</segment><segment>and</segment><segment>M.</segment><segment>Vieira.</segment><segment>Benchmarking</segment><segment>Static</segment><segment>Analysis</segment><segment>Tools</segment><segment>for</segment><segment>Web</segment><segment>Security.</segment><segment>IEEE</segment><segment>Transactions</segment><segment>on</segment><segment>Reliability,</segment><segment>2018.</segment><segment>[39]</segment><segment>M.</segment><segment>Miltenberger,</segment><segment>et</segment><segment>al.</segment><segment>Benchmarking</segment><segment>the</segment><segment>Benchmarks.</segment><segment>ACM,</segment><segment>2023.</segment><segment>[40]</segment><segment>N.</segment><segment>Risse,</segment><segment>et</segment><segment>al.</segment><segment>On</segment><segment>Benchmarking</segment><segment>in</segment><segment>Machine</segment><segment>Learning</segment><segment>for</segment><segment>Vulnerability</segment><segment>Detection.</segment><segment>ISSTA,</segment><segment>2025.</segment><segment>[41]</segment><segment>H.</segment><segment>Xu,</segment><segment>S.</segment><segment>Wang,</segment><segment>N.</segment><segment>Li,</segment><segment>K.</segment><segment>Wang,</segment><segment>Y.</segment><segment>Zhao,</segment><segment>K.</segment><segment>Chen,</segment><segment>T.</segment><segment>Yu,</segment><segment>Y.</segment><segment>Liu,</segment><segment>and</segment><segment>H.</segment><segment>Wang.</segment><segment>Large</segment><segment>Language</segment><segment>Models</segment><segment>for</segment><segment>Cyber</segment><segment>Security:</segment><segment>A</segment><segment>Systematic</segment><segment>Literature</segment><segment>Review.</segment><segment>arXiv:2405.04760,</segment><segment>2024.</segment><segment>[42]</segment><segment>S.</segment><segment>M.</segment><segment>Taghavi</segment><segment>Far,</segment><segment>et</segment><segment>al.</segment><segment>Large</segment><segment>Language</segment><segment>Models</segment><segment>for</segment><segment>Software</segment><segment>Vulnerability</segment><segment>Detection.</segment><segment>International</segment><segment>Journal</segment><segment>of</segment><segment>Information</segment><segment>Security,</segment><segment>2025.</segment><segment>[43]</segment><segment>Y.</segment><segment>Chen,</segment><segment>et</segment><segment>al.</segment><segment>A</segment><segment>Survey</segment><segment>of</segment><segment>Large</segment><segment>Language</segment><segment>Models</segment><segment>for</segment><segment>Cyber</segment><segment>Threat</segment><segment>Detection.</segment><segment>Computers</segment><segment>&amp;</segment><segment>Security,</segment><segment>2024.</segment><segment>[44]</segment><segment>Y.</segment><segment>Zhu,</segment><segment>A.</segment><segment>Kellermann,</segment><segment>D.</segment><segment>Bowman,</segment><segment>P.</segment><segment>Li,</segment><segment>A.</segment><segment>Gupta,</segment><segment>A.</segment><segment>Danda,</segment><segment>R.</segment><segment>Fang,</segment><segment>C.</segment><segment>Jensen,</segment><segment>E.</segment><segment>Ihli,</segment><segment>J.</segment><segment>Benn,</segment><segment>et</segment><segment>al.</segment><segment>CVE-Bench:</segment><segment>A</segment><segment>Benchmark</segment><segment>for</segment><segment>AI</segment><segment>Agents'</segment><segment>Ability</segment><segment>to</segment><segment>Exploit</segment><segment>Real-World</segment><segment>Web</segment><segment>Application</segment><segment>Vulnerabilities.</segment><segment>ICML,</segment><segment>2025.</segment><segment>[45]</segment><segment>R.</segment><segment>Fang,</segment><segment>et</segment><segment>al.</segment><segment>Cybench:</segment><segment>A</segment><segment>Framework</segment><segment>for</segment><segment>Evaluating</segment><segment>Cybersecurity</segment><segment>Capabilities</segment><segment>and</segment><segment>Risks</segment><segment>of</segment><segment>Language</segment><segment>Models.</segment><segment>arXiv:2408.08926,</segment><segment>2024.</segment><segment>[46]</segment><segment>M.</segment><segment>Malkawi</segment><segment>and</segment><segment>R.</segment><segment>Alhajj.</segment><segment>AI-Powered</segment><segment>Vulnerability</segment><segment>Detection</segment><segment>and</segment><segment>Patch</segment><segment>Management</segment><segment>in</segment><segment>Cybersecurity:</segment><segment>A</segment><segment>Systematic</segment><segment>Review</segment><segment>of</segment><segment>Techniques,</segment><segment>Challenges,</segment><segment>and</segment><segment>Emerging</segment><segment>Trends.</segment><segment>Machine</segment><segment>Learning</segment><segment>and</segment><segment>Knowledge</segment><segment>Extraction,</segment><segment>vol.</segment><segment>8,</segment><segment>no.</segment><segment>1,</segment><segment>Article</segment><segment>19,</segment><segment>2026.</segment><segment>doi:10.3390/make8010019.</segment><segment>[47]</segment><segment>ISO/IEC.</segment><segment>ISO/IEC</segment><segment>27034-1:2011,</segment><segment>Information</segment><segment>technology</segment><segment>-</segment><segment>Security</segment><segment>techniques</segment><segment>-</segment><segment>Application</segment><segment>security</segment><segment>-</segment><segment>Part</segment><segment>1:</segment><segment>Overview</segment><segment>and</segment><segment>concepts.</segment><segment>International</segment><segment>Organization</segment><segment>for</segment><segment>Standardization,</segment><segment>2011.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment><segment>G.</segment><segment>2076</segment><segment>Page</segment><segment>33</segment><segment>[48]</segment><segment>ISO/IEC/IEEE.</segment><segment>ISO/IEC/IEEE</segment><segment>29119-1:2022,</segment><segment>Software</segment><segment>and</segment><segment>systems</segment><segment>engineering</segment><segment>-</segment><segment>Software</segment><segment>testing</segment><segment>-</segment><segment>Part</segment><segment>1:</segment><segment>General</segment><segment>concepts.</segment><segment>International</segment><segment>Organization</segment><segment>for</segment><segment>Standardization,</segment><segment>2022.</segment><segment>[49]</segment><segment>NIST.</segment><segment>Digital</segment><segment>Identity</segment><segment>Guidelines:</segment><segment>Authentication</segment><segment>and</segment><segment>Lifecycle</segment><segment>Management,</segment><segment>SP</segment><segment>800-</segment><segment>63B.</segment><segment>National</segment><segment>Institute</segment><segment>of</segment><segment>Standards</segment><segment>and</segment><segment>Technology,</segment><segment>latest</segment><segment>available</segment><segment>revision</segment><segment>accessed</segment><segment>27</segment><segment>April</segment><segment>2026.</segment><segment>GRJNST,</segment><segment>Volume:</segment><segment>04</segment><segment>-</segment><segment>Issue</segment><segment>2</segment><segment>(2026)</segment><segment>/</segment><segment>ISSN</segment><segment>P:</segment><segment>2790-7643</segment><segment>Article</segment><segment>ID:</segment><segment>2076</segment><segment>https://doi.org/10.53762/grjnst.04.02.27</segment></root>