<owl:Class xmlns="https://folio.openlegalstandard.org/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:v1="http://www.loc.gov/mads/rdf/v1#" xmlns:owl="http://www.w3.org/2002/07/owl#" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:xsd="http://www.w3.org/2001/XMLSchema#" xmlns:folio="https://folio.openlegalstandard.org/" xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#" xmlns:skos="http://www.w3.org/2004/02/skos/core#" rdf:about="https://folio.openlegalstandard.org/RCQ5aTqEDpPwcRvtzkx0T6e">
  <rdfs:subClassOf rdf:resource="https://folio.openlegalstandard.org/RBHMad8oNmYXkYHOHZLCgqv"/>
  <rdfs:label>Reinforcement Learning</rdfs:label>
  <skos:prefLabel>RL</skos:prefLabel>
  <skos:definition>Reinforcement Learning (RL) is a subset of machine learning that enables an artificial system, or agent, to optimize its behavior in a given environment by learning from feedback signals, such as rewards or punishments. The goal is to maximize the cumulative reward received, which is determined by a reward function representing the system's objectives (e.g., answering legal questions, drafting legal documents).</skos:definition>
</owl:Class>