{"$schema":"https://policywindow.org/critique/api/schema","name":"Critical AI — critique calibration","description":"How close Critical AI's per-paper critiques are to the published human-expert standard. Each critique is compared, on a shared dimension vocabulary, against the benchmark corpus of real Comments/replications/reanalyses: dimensional alignment (does it attend to the lenses experts emphasise), breadth vs the human range, and the credibility gates the benchmarks embody (sourced, severity-disciplined, claims-not-motives). All re-derived in-app from the corpus + the critiques.","docs":"https://policywindow.org/critique/benchmarks","alignment_threshold":0.8,"reference":{"n":68,"frequency":{"methods":0.9117647058823529,"identification":0.36764705882352944,"statistics":0.7205882352941176,"data_code":0.25,"claims":0.9117647058823529,"reproducibility":0.5735294117647058,"overclaiming":0.45588235294117646,"generalisation":0.4411764705882353,"theory":0.16176470588235295,"novelty":0.04411764705882353},"breadth":{"min":3,"q1":4,"median":5,"q3":5,"max":6,"mean":4.84}},"domain_profiles":[{"domain":"economics","label":"Economics & finance","reference":{"n":14,"frequency":{"methods":0.9285714285714286,"identification":0.5714285714285714,"statistics":0.8571428571428571,"data_code":0.42857142857142855,"claims":0.9285714285714286,"reproducibility":0.7142857142857143,"overclaiming":0.21428571428571427,"generalisation":0.14285714285714285,"theory":0.07142857142857142,"novelty":0},"breadth":{"min":4,"q1":4,"median":5,"q3":5.75,"max":6,"mean":4.86}},"topDimensions":[{"dimension":"methods","frequency":0.9285714285714286},{"dimension":"claims","frequency":0.9285714285714286},{"dimension":"statistics","frequency":0.8571428571428571},{"dimension":"reproducibility","frequency":0.7142857142857143}]},{"domain":"political_science","label":"Political science","reference":{"n":9,"frequency":{"methods":0.7777777777777778,"identification":0.4444444444444444,"statistics":0.8888888888888888,"data_code":0.5555555555555556,"claims":0.7777777777777778,"reproducibility":0.7777777777777778,"overclaiming":0.5555555555555556,"generalisation":0.3333333333333333,"theory":0.1111111111111111,"novelty":0.1111111111111111},"breadth":{"min":5,"q1":5,"median":5,"q3":6,"max":6,"mean":5.33}},"topDimensions":[{"dimension":"statistics","frequency":0.8888888888888888},{"dimension":"methods","frequency":0.7777777777777778},{"dimension":"claims","frequency":0.7777777777777778},{"dimension":"reproducibility","frequency":0.7777777777777778}]},{"domain":"psychology","label":"Psychology","reference":{"n":7,"frequency":{"methods":1,"identification":0.14285714285714285,"statistics":1,"data_code":0,"claims":1,"reproducibility":1,"overclaiming":0.14285714285714285,"generalisation":0.42857142857142855,"theory":0.14285714285714285,"novelty":0},"breadth":{"min":4,"q1":4.5,"median":5,"q3":5,"max":6,"mean":4.86}},"topDimensions":[{"dimension":"methods","frequency":1},{"dimension":"statistics","frequency":1},{"dimension":"claims","frequency":1},{"dimension":"reproducibility","frequency":1}]},{"domain":"sociology","label":"Sociology","reference":{"n":6,"frequency":{"methods":1,"identification":0.3333333333333333,"statistics":0.6666666666666666,"data_code":0.3333333333333333,"claims":1,"reproducibility":0.6666666666666666,"overclaiming":0.5,"generalisation":0.3333333333333333,"theory":0.3333333333333333,"novelty":0},"breadth":{"min":5,"q1":5,"median":5,"q3":5,"max":6,"mean":5.17}},"topDimensions":[{"dimension":"methods","frequency":1},{"dimension":"claims","frequency":1},{"dimension":"statistics","frequency":0.6666666666666666},{"dimension":"reproducibility","frequency":0.6666666666666666}]},{"domain":"public_policy","label":"Public policy & criminology","reference":{"n":6,"frequency":{"methods":1,"identification":0.16666666666666666,"statistics":0.6666666666666666,"data_code":0.3333333333333333,"claims":1,"reproducibility":0.16666666666666666,"overclaiming":0.5,"generalisation":0.3333333333333333,"theory":0.16666666666666666,"novelty":0.16666666666666666},"breadth":{"min":3,"q1":4.25,"median":5,"q3":5,"max":5,"mean":4.5}},"topDimensions":[{"dimension":"methods","frequency":1},{"dimension":"claims","frequency":1},{"dimension":"statistics","frequency":0.6666666666666666},{"dimension":"overclaiming","frequency":0.5}]},{"domain":"communication","label":"Communication & media","reference":{"n":4,"frequency":{"methods":1,"identification":0.25,"statistics":0.5,"data_code":0,"claims":1,"reproducibility":0.5,"overclaiming":0.5,"generalisation":0.75,"theory":0.25,"novelty":0},"breadth":{"min":4,"q1":4,"median":4.5,"q3":5.25,"max":6,"mean":4.75}},"topDimensions":[{"dimension":"methods","frequency":1},{"dimension":"claims","frequency":1},{"dimension":"generalisation","frequency":0.75},{"dimension":"statistics","frequency":0.5}]},{"domain":"education","label":"Education","reference":{"n":4,"frequency":{"methods":0.5,"identification":0.5,"statistics":0.5,"data_code":0,"claims":1,"reproducibility":0,"overclaiming":0.75,"generalisation":0.75,"theory":0.5,"novelty":0.25},"breadth":{"min":3,"q1":4.5,"median":5,"q3":5.25,"max":6,"mean":4.75}},"topDimensions":[{"dimension":"claims","frequency":1},{"dimension":"overclaiming","frequency":0.75},{"dimension":"generalisation","frequency":0.75},{"dimension":"methods","frequency":0.5}]},{"domain":"management","label":"Management, IS & marketing","reference":{"n":3,"frequency":{"methods":1,"identification":1,"statistics":1,"data_code":0,"claims":0.3333333333333333,"reproducibility":0.6666666666666666,"overclaiming":0,"generalisation":0.3333333333333333,"theory":0,"novelty":0},"breadth":{"min":4,"q1":4,"median":4,"q3":4.5,"max":5,"mean":4.33}},"topDimensions":[{"dimension":"methods","frequency":1},{"dimension":"identification","frequency":1},{"dimension":"statistics","frequency":1},{"dimension":"reproducibility","frequency":0.6666666666666666}]}],"scored":63,"calibrated":17,"mean_alignment":0.721,"results":[{"critiqueId":"CRIT-000013","slug":"peng-copilot-developer-productivity","targetTitle":"The Impact of AI on Developer Productivity: Evidence from GitHub Copilot","accessBasis":"open_access","dimensions":["identification","statistics","generalisation","claims","reproducibility","overclaiming","methods"],"alignment":0.935,"aligned":true,"breadth":7,"breadthBand":"comprehensive","domain":"economics","domainAlignment":0.874,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.94); broader than a typical Comment (7 dimensions vs human median 5)."},{"critiqueId":"CRIT-000002","slug":"brynjolfsson-li-raymond-generative-ai-at-work-qje-2025","targetTitle":"Generative AI at Work","accessBasis":"open_access","dimensions":["identification","methods","statistics","claims","reproducibility","data_code","overclaiming","generalisation"],"alignment":0.924,"aligned":true,"breadth":8,"breadthBand":"comprehensive","domain":"economics","domainAlignment":0.898,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.92); broader than a typical Comment (8 dimensions vs human median 5)."},{"critiqueId":"CRIT-000014","slug":"farach-scaffolding-human-ai-collaboration","targetTitle":"Scaffolding Human–AI Collaboration: A Field Experiment on Behavioral Protocols and Cognitive Reframing","accessBasis":"open_access","dimensions":["identification","statistics","methods","claims","generalisation","reproducibility"],"alignment":0.905,"aligned":true,"breadth":6,"breadthBand":"comprehensive","domain":"management","domainAlignment":0.924,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.91); broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-GEN-when-influencers-delegat","slug":"when-influencers-delegate-replies-how-social-ai-ag","targetTitle":"When Influencers Delegate Replies: How Social AI Agents Shape User Engagement","accessBasis":"abstract_only","dimensions":["identification","statistics","methods","claims","generalisation","reproducibility"],"alignment":0.905,"aligned":true,"breadth":6,"breadthBand":"comprehensive","domain":"management","domainAlignment":0.924,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.91); broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-GEN-more-versus-better-artif","slug":"more-versus-better-artificial-intelligence-incenti","targetTitle":"More Versus Better: Artificial Intelligence, Incentives, and the Emerging Crisis in Peer Review","accessBasis":"user_supplied","dimensions":["identification","methods","statistics","claims","generalisation","overclaiming"],"alignment":0.878,"aligned":true,"breadth":6,"breadthBand":"comprehensive","domain":"management","domainAlignment":0.782,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.88); broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-000031","slug":"ai-chatbots-small-labor-effects","targetTitle":"Large Language Models, Small Labor Market Effects","accessBasis":"open_access","dimensions":["methods","statistics","overclaiming","generalisation","claims"],"alignment":0.869,"aligned":true,"breadth":5,"breadthBand":"typical","domain":"economics","domainAlignment":0.729,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.87); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000024","slug":"ai-empathy-prosocial-behavior-employees","targetTitle":"Effect of AI empathy perception on employees' prosocial behavior: mediating role of warmth and moderating role of AI anthropomorphism","accessBasis":"open_access","dimensions":["statistics","methods","overclaiming","identification","claims"],"alignment":0.85,"aligned":true,"breadth":5,"breadthBand":"typical","domain":"management","domainAlignment":0.778,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.85); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000037","slug":"ai-technostress-mental-health-sem","targetTitle":"Mental health in the “era” of artificial intelligence: technostress and the perceived impact on anxiety and depressive disorders—an SEM analysis","accessBasis":"open_access","dimensions":["identification","statistics","methods","overclaiming","claims"],"alignment":0.85,"aligned":true,"breadth":5,"breadthBand":"typical","domain":"psychology","domainAlignment":0.713,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.85); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000033","slug":"social-media-images-sociopolitical-sentiment","targetTitle":"Investigating the impact of social media images on users' sentiments towards sociopolitical events based on deep artificial intelligence","accessBasis":"open_access","dimensions":["identification","statistics","methods","generalisation","claims"],"alignment":0.846,"aligned":true,"breadth":5,"breadthBand":"typical","domain":"communication","domainAlignment":0.844,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.85); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-GEN-being-literate-behaving-","slug":"being-literate-behaving-literate-a-mixed-methods-a","targetTitle":"Being literate, behaving literate? A mixed-methods approach to adolescents’ algorithm literacy and behavioral strategies on social media","accessBasis":"user_supplied","dimensions":["statistics","methods","claims","generalisation"],"alignment":0.842,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.876,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.84); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-resilience-and-disempowe","slug":"resilience-and-disempowerment-in-algorithmic-syste","targetTitle":"Resilience and disempowerment in algorithmic systems","accessBasis":"abstract_only","dimensions":["statistics","methods","claims","generalisation"],"alignment":0.842,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.876,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.84); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000009","slug":"the-politics-of-artificial-intelligence-alignment","targetTitle":"The politics of artificial intelligence alignment: Public reactions to AI moderation in the case of Google’s Gemini","accessBasis":"abstract_only","dimensions":["generalisation","statistics","claims","methods"],"alignment":0.842,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"political_science","domainAlignment":0.737,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.84); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000028","slug":"llm-effects-unemployment-earnings","targetTitle":"The (Short-Term) Effects of Large Language Models on Unemployment and Earnings","accessBasis":"open_access","dimensions":["statistics","identification","methods","claims"],"alignment":0.822,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"economics","domainAlignment":0.872,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.82); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000026","slug":"racial-disparities-time-to-recidivism","targetTitle":"Fairness Is More Than Algorithms: Racial Disparities in Time-to-Recidivism","accessBasis":"open_access","dimensions":["statistics","identification","methods","claims"],"alignment":0.822,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"public_policy","domainAlignment":0.814,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.82); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000044","slug":"conversational-persuasiveness-gpt4","targetTitle":"On the conversational persuasiveness of GPT-4","accessBasis":"open_access","dimensions":["overclaiming","methods","claims","reproducibility"],"alignment":0.805,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.763,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.81); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000012","slug":"generative-ai-propaganda-and-digital-authoritarian","targetTitle":"Generative AI, propaganda, and digital authoritarianism: Comparative insights from six democratically weakened countries","accessBasis":"abstract_only","dimensions":["generalisation","claims","methods","reproducibility"],"alignment":0.801,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.876,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.80); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000010","slug":"refusal-as-silence-gendered-disparities-in-vision","targetTitle":"Refusal as silence: Gendered disparities in Vision-Language Model responses","accessBasis":"abstract_only","dimensions":["generalisation","reproducibility","claims","methods"],"alignment":0.801,"aligned":true,"breadth":4,"breadthBand":"typical","domain":"sociology","domainAlignment":0.792,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"calibrated","note":"attends to the expert-emphasised lenses (alignment 0.80); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-the-rise-of-ai-sovereign","slug":"the-rise-of-ai-sovereignty","targetTitle":"The rise of AI sovereignty: Authoritarian technological imaginaries as a form of reflexive control","accessBasis":"user_supplied","dimensions":["theory","claims","generalisation","overclaiming","methods","reproducibility"],"alignment":0.796,"aligned":false,"breadth":6,"breadthBand":"comprehensive","domain":"political_science","domainAlignment":0.722,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.80 < 0.8); broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-GEN-scp-artificial-intellige","slug":"scp-artificial-intelligence-scp-adoption-and-the-d","targetTitle":"Artificial intelligence adoption and the demand for managerial expertise","accessBasis":"abstract_only","dimensions":["methods","statistics","claims","theory","generalisation"],"alignment":0.794,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"management","domainAlignment":0.623,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.79 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000035","slug":"ai-social-media-political-competition-democracy","targetTitle":"Artificial intelligence and social media as new arenas of political competition: challenges for democracy","accessBasis":"open_access","dimensions":["overclaiming","methods","data_code","reproducibility","claims"],"alignment":0.783,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"political_science","domainAlignment":0.817,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.78 < 0.8); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-GEN-how-costs-influence-pref","slug":"how-costs-influence-preferences-for-control-in-gen","targetTitle":"How Costs Influence Preferences for Control in Generative Artificial Intelligence (GenAI): Human-Guided vs. GenAI-Based Delegated Search","accessBasis":"abstract_only","dimensions":["identification","methods","claims","overclaiming","theory","reproducibility"],"alignment":0.779,"aligned":false,"breadth":6,"breadthBand":"comprehensive","domain":"management","domainAlignment":0.64,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.78 < 0.8); full-text review needed to reach the calibrated standard; broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-000016","slug":"cultural-bias-alignment-llms","targetTitle":"Cultural bias and cultural alignment of large language models","accessBasis":"abstract_only","dimensions":["generalisation","methods","overclaiming","claims"],"alignment":0.768,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"sociology","domainAlignment":0.748,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.77 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000003","slug":"the-cybernetic-teammate-a-field-experiment-on-gene","targetTitle":"The Cybernetic Teammate: A Field Experiment on Generative AI and Teamwork","accessBasis":"user_supplied","dimensions":["generalisation","claims","methods","overclaiming"],"alignment":0.768,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"management","domainAlignment":0.435,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.77 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000029","slug":"genai-classroom-teaching-university-teachers","targetTitle":"Factors influencing the adoption of generative artificial intelligence into classroom teaching by university teachers: An empirical study using SPSS PROCESS macros","accessBasis":"open_access","dimensions":["statistics","identification","reproducibility","overclaiming","claims"],"alignment":0.765,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"education","domainAlignment":0.689,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.77 < 0.8); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000034","slug":"chatgpt-acceptance-higher-education-utaut2","targetTitle":"Exploring the acceptance of ChatGPT in higher education: a comprehensive quantitative study of university students and faculty","accessBasis":"open_access","dimensions":["statistics","identification","generalisation","reproducibility","claims"],"alignment":0.761,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"education","domainAlignment":0.689,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.76 < 0.8); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000048","slug":"real-time-ai-sentiment-self-moderation","targetTitle":"Real-time artificial intelligence sentiment feedback promotes self-moderation in contentious online discussion","accessBasis":"licensed_access","dimensions":["overclaiming","statistics","methods","reproducibility"],"alignment":0.751,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.674,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.75 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000018","slug":"genai-usage-university-students-harmful-helpful","targetTitle":"Is it harmful or helpful? Examining the causes and consequences of generative AI usage among university students","accessBasis":"abstract_only","dimensions":["identification","methods","claims","overclaiming"],"alignment":0.747,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.77,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.75 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000008","slug":"ai-meets-politics-examining-the-effects-of-differe","targetTitle":"AI meets politics: Examining the effects of different targeting strategies across 15 countries","accessBasis":"user_supplied","dimensions":["generalisation","claims","methods","identification"],"alignment":0.743,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"political_science","domainAlignment":0.619,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.74 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000049","slug":"multimodal-llm-context-sensitive-hate-speech","targetTitle":"Multimodal large language models can make context-sensitive hate speech evaluations aligned with human judgement","accessBasis":"licensed_access","dimensions":["overclaiming","claims","methods"],"alignment":0.743,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"other","domainAlignment":null,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.74 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000019","slug":"student-perspectives-generative-ai-higher-ed","targetTitle":"Student perspectives on the use of generative artificial intelligence technologies in higher education","accessBasis":"abstract_only","dimensions":["generalisation","methods","claims","identification"],"alignment":0.743,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.77,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.74 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000032","slug":"ai-voice-similarity-likability-trust","targetTitle":"AI-determined similarity increases likability and trustworthiness of human voices","accessBasis":"open_access","dimensions":["overclaiming","identification","statistics","generalisation","claims"],"alignment":0.731,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"psychology","domainAlignment":0.589,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.73 < 0.8); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-GEN-algorithmic-responsibili","slug":"algorithmic-responsibility-in-ppc-practice-interpr","targetTitle":"Algorithmic responsibility in PPC practice: Interpreting black boxes in digital advertising work","accessBasis":"abstract_only","dimensions":["methods","claims","theory","generalisation","overclaiming"],"alignment":0.728,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"sociology","domainAlignment":0.748,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.73 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-GEN-from-prompt-engineering-","slug":"from-prompt-engineering-to-prompt-design-research","targetTitle":"From prompt engineering to prompt design: Research strategies for visual generative AI","accessBasis":"abstract_only","dimensions":["theory","methods","claims","generalisation","overclaiming"],"alignment":0.728,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"communication","domainAlignment":0.844,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.73 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-GEN-making-genai-valuable-be","slug":"making-genai-valuable-benchmarks-singularities-and","targetTitle":"Making GenAI valuable: Benchmarks, singularities, and the enrichment economy","accessBasis":"user_supplied","dimensions":["theory","claims","generalisation","overclaiming","methods"],"alignment":0.728,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"sociology","domainAlignment":0.748,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.73 < 0.8); breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000038","slug":"genai-college-student-learning-engagement","targetTitle":"Whether and When Could Generative AI Improve College Student Learning Engagement?","accessBasis":"open_access","dimensions":["identification","statistics","methods","reproducibility"],"alignment":0.726,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.42,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.73 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000027","slug":"welfare-ai-claimant-preferences","targetTitle":"Heterogeneous preferences and asymmetric insights for AI use among welfare claimants and non-claimants","accessBasis":"open_access","dimensions":["statistics","overclaiming","generalisation","claims"],"alignment":0.714,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"public_policy","domainAlignment":0.718,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.71 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000039","slug":"ai-education-learners-eyes-perceptions-challenges","targetTitle":"AI in education through the learners’ eyes: practical experience, perceptions, and challenges","accessBasis":"open_access","dimensions":["identification","statistics","methods","overclaiming"],"alignment":0.693,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.63,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000030","slug":"ai-tutoring-rct-active-learning","targetTitle":"AI tutoring outperforms in-class active learning: an RCT introducing a novel research-based design in an authentic educational setting","accessBasis":"open_access","dimensions":["identification","overclaiming","statistics","claims"],"alignment":0.693,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.77,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000020","slug":"inconsistent-advice-chatgpt-decision-making","targetTitle":"Inconsistent advice by ChatGPT influences decision making in various areas","accessBasis":"open_access","dimensions":["identification","statistics","overclaiming","claims"],"alignment":0.693,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.555,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000041","slug":"political-ideology-ai-policy-making","targetTitle":"Political ideology shapes support for the use of AI in policy-making","accessBasis":"open_access","dimensions":["identification","statistics","methods","overclaiming"],"alignment":0.693,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"political_science","domainAlignment":0.707,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000015","slug":"theory-of-mind-llms-humans","targetTitle":"Testing theory of mind in large language models and humans","accessBasis":"abstract_only","dimensions":["theory","methods","overclaiming","claims"],"alignment":0.689,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.555,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.69 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-beyond-disruption-and-in","slug":"beyond-disruption-and-invisibility-interactional-c","targetTitle":"Beyond disruption and invisibility: Interactional continuity in everyday AI use in India","accessBasis":"user_supplied","dimensions":["generalisation","claims","methods","theory"],"alignment":0.685,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.809,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-crafting-computer-vision","slug":"crafting-computer-vision-through-human-eyes-an-ai","targetTitle":"Crafting computer vision through human eyes: An AI laboratory ethnography","accessBasis":"abstract_only","dimensions":["generalisation","claims","methods","theory"],"alignment":0.685,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"sociology","domainAlignment":0.704,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.69 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-into-the-black-box-laype","slug":"into-the-black-box-laypeople-s-folk-theories-about","targetTitle":"Into the black box: Laypeople's folk theories about generative artificial intelligence chatbots","accessBasis":"user_supplied","dimensions":["claims","methods","generalisation","theory"],"alignment":0.685,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"communication","domainAlignment":0.809,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.69 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-working-the-algorithm-co","slug":"working-the-algorithm-contextual-skills-of-on-dema","targetTitle":"Working the algorithm: Contextual skills of on-demand gig workers","accessBasis":"abstract_only","dimensions":["methods","claims","generalisation","theory"],"alignment":0.685,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"sociology","domainAlignment":0.704,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.69 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000040","slug":"ai-regulation-support-bayesian-network","targetTitle":"Understanding support for AI regulation: A Bayesian network perspective","accessBasis":"open_access","dimensions":["statistics","overclaiming","methods"],"alignment":0.68,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"political_science","domainAlignment":0.68,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.68 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000023","slug":"ai-self-preferencing-algorithmic-hiring","targetTitle":"AI Self-preferencing in Algorithmic Hiring: Empirical Evidence and Insights","accessBasis":"open_access","dimensions":["methods","statistics","generalisation"],"alignment":0.676,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"economics","domainAlignment":0.591,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.68 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000025","slug":"local-us-officials-views-ai-governance","targetTitle":"Local US officials' views on the impacts and governance of AI: Evidence from 2022 and 2023 survey waves","accessBasis":"open_access","dimensions":["statistics","identification","claims"],"alignment":0.652,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"political_science","domainAlignment":0.646,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.65 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000021","slug":"postgraduate-students-perceptions-ai-research-plos","targetTitle":"Postgraduate students' perceptions of artificial intelligence integration in research: A cross-sectional study","accessBasis":"open_access","dimensions":["overclaiming","identification","methods","reproducibility"],"alignment":0.652,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"education","domainAlignment":0.49,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.65 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000042","slug":"positioning-political-texts-llm-asking-averaging","targetTitle":"Positioning Political Texts with Large Language Models by Asking and Averaging","accessBasis":"open_access","dimensions":["identification","methods","statistics","data_code"],"alignment":0.635,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"political_science","domainAlignment":0.707,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.64 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000043","slug":"human-ai-feedback-loops-bias-amplification","targetTitle":"How human–AI feedback loops alter human perceptual, emotional and social judgements","accessBasis":"open_access","dimensions":["overclaiming","methods","reproducibility","data_code"],"alignment":0.618,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.52,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.62 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000017","slug":"genai-creativity-collective-diversity","targetTitle":"Generative AI enhances individual creativity but reduces the collective diversity of novel content","accessBasis":"abstract_only","dimensions":["claims","generalisation","overclaiming","identification"],"alignment":0.614,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.416,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.61 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-GEN-backfiring-ai-ai-deploym","slug":"backfiring-ai-ai-deployment-in-workplace","targetTitle":"Backfiring AI? AI Deployment in Workplace","accessBasis":"abstract_only","dimensions":["theory","generalisation","claims","overclaiming","reproducibility","novelty"],"alignment":0.596,"aligned":false,"breadth":6,"breadthBand":"comprehensive","domain":"management","domainAlignment":0.284,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.60 < 0.8); full-text review needed to reach the calibrated standard; broader than a typical Comment (6 dimensions vs human median 5)."},{"critiqueId":"CRIT-000022","slug":"when-ai-judges-your-work","targetTitle":"When an AI Judges Your Work: The Hidden Costs of Algorithmic Assessment","accessBasis":"open_access","dimensions":["identification","overclaiming","methods"],"alignment":0.565,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"psychology","domainAlignment":0.36,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.56 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000006","slug":"can-chatgpt-kill-user-generated-qa-platforms","targetTitle":"Can ChatGPT Kill User-Generated Q&A Platforms?","accessBasis":"abstract_only","dimensions":["generalisation","identification","claims"],"alignment":0.561,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"management","domainAlignment":0.503,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.56 < 0.8); full-text review needed to reach the calibrated standard; more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000004","slug":"artificial-collusion-examining-supracompetitive-pr","targetTitle":"Artificial Collusion: Examining Supracompetitive Pricing by Q-Learning Algorithms","accessBasis":"abstract_only","dimensions":["generalisation","overclaiming","claims","theory"],"alignment":0.556,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"economics","domainAlignment":0.36,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.56 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000011","slug":"from-rule-of-law-to-rule-of-algorithm-generative-a","targetTitle":"From rule of law to rule of algorithm: Generative Artificial Intelligence's threat to democracy","accessBasis":"user_supplied","dimensions":["claims","overclaiming","theory","generalisation"],"alignment":0.556,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"political_science","domainAlignment":0.471,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.56 < 0.8); breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000005","slug":"unraveling-generative-ai-from-a-human-intelligence","targetTitle":"Unraveling Generative AI from a Human Intelligence Perspective: A Battery of Experiments","accessBasis":"abstract_only","dimensions":["theory","overclaiming","generalisation","claims"],"alignment":0.556,"aligned":false,"breadth":4,"breadthBand":"typical","domain":"psychology","domainAlignment":0.416,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.56 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (4 dimensions)."},{"critiqueId":"CRIT-000046","slug":"perceived-human-vs-ai-empathy","targetTitle":"Comparing the value of perceived human versus AI-generated empathy","accessBasis":"licensed_access","dimensions":["methods","overclaiming","data_code"],"alignment":0.527,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"psychology","domainAlignment":0.32,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.53 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-GEN-charismatic-machines-on-","slug":"charismatic-machines-on-the-epistemic-power-of-gen","targetTitle":"Charismatic machines: On the epistemic power of generative AI within platform convergence","accessBasis":"abstract_only","dimensions":["theory","claims","novelty","overclaiming","generalisation"],"alignment":0.509,"aligned":false,"breadth":5,"breadthBand":"typical","domain":"communication","domainAlignment":0.603,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.51 < 0.8); full-text review needed to reach the calibrated standard; breadth typical of the genre (5 dimensions)."},{"critiqueId":"CRIT-000047","slug":"reducing-political-polarization-ai-conversations","targetTitle":"Reducing political polarization through conversations with artificial intelligence","accessBasis":"licensed_access","dimensions":["overclaiming","methods","theory"],"alignment":0.498,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"political_science","domainAlignment":0.442,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.50 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000007","slug":"made-with-ai-consumer-engagement-with-social-media","targetTitle":"Made With AI: Consumer Engagement with Social Media Containing AI Disclosures","accessBasis":"abstract_only","dimensions":["generalisation","claims","theory"],"alignment":0.494,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"management","domainAlignment":0.201,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"scope-limited by abstract-only access — cannot reach the methods/statistics/identification lenses experts emphasise (alignment 0.49 < 0.8); full-text review needed to reach the calibrated standard; more focused than a typical critique (3 dimensions vs human median 5)."},{"critiqueId":"CRIT-000045","slug":"cultural-tendencies-generative-ai","targetTitle":"Cultural tendencies in generative AI","accessBasis":"licensed_access","dimensions":["overclaiming","identification","generalisation"],"alignment":0.412,"aligned":false,"breadth":3,"breadthBand":"focused","domain":"psychology","domainAlignment":0.2,"disciplined":true,"disciplineErrors":[],"grounding":1,"grounded":true,"verdict":"needs_review","note":"under-attends to the expert-emphasised lenses (alignment 0.41 < 0.8); more focused than a typical critique (3 dimensions vs human median 5)."}]}