{"data":{"id":"002874c9-3d69-4a57-bda7-a9633bc29c79","title":"Model-Based Offline Reinforcement Learning With Adversarial Data Augmentation","summary":"Model-based offline reinforcement learning (RL, where an AI learns to make decisions from a fixed dataset without interacting with a live environment) struggles because static data makes it hard to develop robust policies. This paper introduces MORAL, which uses adversarial data augmentation (a technique where competing AI models deliberately generate challenging training examples to improve robustness) to dynamically enrich training data and improve policy learning instead of using traditional fixed rollout methods.","solution":"N/A -- no mitigation discussed in source.","labels":["research"],"sourceUrl":"http://ieeexplore.ieee.org/document/11271829","publishedAt":"2025-12-02T13:16:34.000Z","cveId":null,"cweIds":null,"cvssScore":null,"cvssSeverity":null,"severity":"info","attackType":[],"issueType":"research","affectedPackages":null,"affectedVendors":[],"affectedVendorsRaw":[],"classifierModel":"claude-haiku-4-5-20251001","classifierPromptVersion":"v3","cvssVector":null,"attackVector":null,"attackComplexity":null,"privilegesRequired":null,"userInteraction":null,"exploitMaturity":null,"epssScore":null,"patchAvailable":null,"disclosureDate":"2025-12-02T13:16:34.000Z","capecIds":null,"crossRefCount":0,"attackSophistication":"moderate","impactType":null,"aiComponentTargeted":"training_data","llmSpecific":false,"classifierConfidence":0.85,"researchCategory":"peer_reviewed","atlasIds":null}}