• bitcoinBitcoin(BTC)$77,259.00-1.57%
  • ethereumEthereum(ETH)$2,300.67-2.61%
  • tetherTether(USDT)$1.00-0.02%
  • rippleXRP(XRP)$1.40-2.12%
  • binancecoinBNB(BNB)$626.34-1.35%
  • usd-coinUSDC(USDC)$1.000.00%
  • solanaSolana(SOL)$84.62-2.50%
  • tronTRON(TRX)$0.3252720.53%
  • Figure HelocFigure Heloc(FIGR_HELOC)$1.031.24%
  • dogecoinDogecoin(DOGE)$0.098664-0.40%
  • whitebitWhiteBIT Coin(WBT)$54.61-1.65%
  • USDSUSDS(USDS)$1.00-0.07%
  • HyperliquidHyperliquid(HYPE)$41.70-1.70%
  • leo-tokenLEO Token(LEO)$10.37-0.01%
  • cardanoCardano(ADA)$0.247624-1.94%
  • bitcoin-cashBitcoin Cash(BCH)$451.17-0.68%
  • moneroMonero(XMR)$378.68-3.47%
  • chainlinkChainlink(LINK)$9.31-1.60%
  • zcashZcash(ZEC)$352.99-1.55%
  • CantonCanton(CC)$0.147598-1.84%
  • stellarStellar(XLM)$0.165824-3.01%
  • MemeCoreMemeCore(M)$3.79-12.06%
  • daiDai(DAI)$1.000.01%
  • USD1USD1(USD1)$1.000.00%
  • litecoinLitecoin(LTC)$55.50-1.15%
  • avalanche-2Avalanche(AVAX)$9.24-2.15%
  • hedera-hashgraphHedera(HBAR)$0.089564-2.91%
  • Ethena USDeEthena USDe(USDE)$1.00-0.02%
  • suiSui(SUI)$0.93-1.32%
  • shiba-inuShiba Inu(SHIB)$0.000006-1.31%
  • RainRain(RAIN)$0.007218-3.80%
  • paypal-usdPayPal USD(PYUSD)$1.00-0.02%
  • the-open-networkToncoin(TON)$1.310.46%
  • crypto-com-chainCronos(CRO)$0.069594-0.91%
  • Circle USYCCircle USYC(USYC)$1.12-0.01%
  • tether-goldTether Gold(XAUT)$4,687.860.31%
  • Global DollarGlobal Dollar(USDG)$1.00-0.02%
  • BittensorBittensor(TAO)$248.48-1.42%
  • World Liberty FinancialWorld Liberty Financial(WLFI)$0.072814-2.91%
  • BlackRock USD Institutional Digital Liquidity FundBlackRock USD Institutional Digital Liquidity Fund(BUIDL)$1.000.00%
  • pax-goldPAX Gold(PAXG)$4,686.070.31%
  • mantleMantle(MNT)$0.64-2.70%
  • polkadotPolkadot(DOT)$1.23-2.22%
  • uniswapUniswap(UNI)$3.24-0.87%
  • SkySky(SKY)$0.0886040.52%
  • Pi NetworkPi Network(PI)$0.1858253.90%
  • Falcon USDFalcon USD(USDF)$1.00-0.05%
  • nearNEAR Protocol(NEAR)$1.36-2.55%
  • okbOKB(OKB)$83.69-0.97%
  • HTX DAOHTX DAO(HTX)$0.0000021.28%
TradePoint.io
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop
No Result
View All Result
TradePoint.io
No Result
View All Result

Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering

April 27, 2026
in AI & Technology
Reading Time: 3 mins read
A A
Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering
ShareShareShareShareShare

YOU MAY ALSO LIKE

US Is Doubling Down on Tech Deals with the Gulf: Helberg

Musk, Altman Feud Heads to Court Over Future of OpenAI

@dataclass
class MemoryItem:
    """A single record stored in the long-term memory bank.

    Fact-bearing records hold an (entity, slot, value) triple together with
    the sentence that states it. Records that carry no answer use
    ``slot="distractor"`` and ``value="n/a"``.
    """

    # Sequential identifier of the record inside the bank.
    memory_id: int
    # Subject area of the entity ("noise" for generic filler records).
    topic: str
    # Name of the project/entity the record talks about ("none" for filler).
    entity: str
    # Attribute name of the fact, or "distractor" when there is no fact.
    slot: str
    # Attribute value of the fact, or "n/a" when there is no fact.
    value: str
    # Natural-language sentence that is embedded and retrieved.
    text: str


def build_memory_bank() -> List[MemoryItem]:
    """Create the synthetic memory bank used for retrieval experiments.

    For each of the eight entities the bank contains, in this order:
    every fact rendered with each of the five fact templates, followed by
    five entity-specific distractor sentences. Eight generic noise
    sentences are appended after all entities. Items receive consecutive
    ``memory_id`` values starting at 0 in insertion order.

    Returns:
        The list of ``MemoryItem`` records (248 items in total).
    """
    # (entity, topic, facts) -- dict insertion order defines the fact order.
    profiles = [
        ("Astra", "robotics", {
            "battery": "18 hours",
            "sensor": "LiDAR",
            "country": "Japan",
            "release_year": "2023",
            "specialty": "warehouse navigation",
        }),
        ("Orion", "astronomy", {
            "telescope": "infrared array",
            "country": "Chile",
            "discovery_year": "2019",
            "target": "exoplanet atmospheres",
            "aperture": "8 meters",
        }),
        ("Vita", "biomedicine", {
            "compound": "VX-17",
            "trial_phase": "Phase II",
            "country": "Canada",
            "target": "inflammatory markers",
            "delivery": "oral capsule",
        }),
        ("Nimbus", "climate", {
            "satellite": "polar orbiter",
            "country": "Norway",
            "launch_year": "2022",
            "instrument": "microwave radiometer",
            "mission": "sea ice monitoring",
        }),
        ("Atlas", "logistics", {
            "fleet_size": "240 trucks",
            "hub": "Muscat",
            "software": "predictive routing",
            "fuel_policy": "hybrid-first",
            "region": "GCC",
        }),
        ("Lumos", "materials", {
            "alloy": "Ti-6Al-4V",
            "process": "laser sintering",
            "density": "4.43 g/cm3",
            "country": "Germany",
            "use_case": "aerospace brackets",
        }),
        ("Cedar", "agriculture", {
            "crop": "wheat",
            "irrigation": "drip control",
            "country": "India",
            "yield_gain": "12 percent",
            "soil_sensor": "capacitive probe",
        }),
        ("Pulse", "healthcare", {
            "device": "ECG patch",
            "battery": "7 days",
            "country": "USA",
            "connectivity": "Bluetooth Low Energy",
            "use_case": "arrhythmia screening",
        }),
    ]

    # Five paraphrases of the same fact, so each fact appears five times.
    fact_templates = (
        "{entity} in {topic} uses {value} for {slot}.",
        "The {slot} associated with {entity} is {value}.",
        "{entity} has {slot}: {value}.",
        "For {entity}, the recorded {slot} is {value}.",
        "Reference note: {entity} -> {slot} = {value}.",
    )

    # Sentences that mention the entity but state no fact about it.
    vague_templates = (
        "{entity} was discussed in a briefing about cross-domain innovation.",
        "{entity} has been compared with several other projects in recent reports.",
        "A summary note mentions {entity} among notable initiatives.",
        "{entity} appears in a high-level update without technical details.",
        "Stakeholders reviewed {entity} in a strategic planning session.",
    )

    # Filler that is not tied to any entity at all.
    generic_noise = (
        "General note: system maintenance occurred on Tuesday.",
        "A committee discussed budget timelines and operational readiness.",
        "The archive includes summaries of projects across multiple departments.",
        "No relevant technical value is stated in this memory.",
        "A status update mentioned partnerships and future opportunities.",
        "An unrelated note references shipping delays and staffing changes.",
        "Background memo: the team reviewed dashboards and reporting cadence.",
        "This memory contains no answer-bearing facts.",
    )

    bank: List[MemoryItem] = []

    def _remember(topic, entity, slot, value, text):
        # The next id is always the current bank size, since ids start at 0
        # and grow by one per appended record.
        bank.append(
            MemoryItem(
                memory_id=len(bank),
                topic=topic,
                entity=entity,
                slot=slot,
                value=value,
                text=text,
            )
        )

    for entity, topic, facts in profiles:
        for slot, value in facts.items():
            for template in fact_templates:
                sentence = template.format(
                    entity=entity, topic=topic, slot=slot, value=value
                )
                _remember(topic, entity, slot, value, sentence)

        # Entity-level distractors follow that entity's facts.
        for template in vague_templates:
            _remember(topic, entity, "distractor", "n/a", template.format(entity=entity))

    for sentence in generic_noise:
        _remember("noise", "none", "distractor", "n/a", sentence)

    return bank


# Build the memory bank once and keep the raw sentences alongside it;
# memory_texts[i] is the text of memory_bank[i].
memory_bank = build_memory_bank()
memory_texts = [m.text for m in memory_bank]
# NOTE(review): embed_texts is defined outside this excerpt; presumably it
# returns one embedding per input text in the same order -- confirm.
memory_embeddings = embed_texts(memory_texts)


def build_queries(memory_bank: List[MemoryItem]) -> List[Dict[str, Any]]:
    """Generate one natural-language question per fact-bearing memory.

    Memories whose slot is ``"distractor"`` are skipped. For every remaining
    memory a question form is drawn with ``random.choice`` and filled with
    the entity and the slot name (underscores shown as spaces). Query ids
    are assigned in bank order before the final list is shuffled in place
    with ``random.shuffle``.

    Args:
        memory_bank: Memory records to derive questions from.

    Returns:
        A shuffled list of dicts with the keys ``query_id``, ``query``,
        ``entity``, ``slot``, ``gold_value``, ``gold_memory_id``,
        ``gold_text`` and ``topic``.
    """
    question_forms = (
        "What is the {slot} of {entity}?",
        "Which {slot} does {entity} have?",
        "Tell me the {slot} for {entity}.",
        "Can you recall the {slot} associated with {entity}?",
        "What was recorded as the {slot} of {entity}?",
    )

    # Only memories that actually state a fact can be asked about.
    answerable = [mem for mem in memory_bank if mem.slot != "distractor"]

    queries = []
    for qid, mem in enumerate(answerable):
        form = random.choice(question_forms)
        readable_slot = mem.slot.replace("_", " ")
        record = {
            "query_id": qid,
            "query": form.format(slot=readable_slot, entity=mem.entity),
            "entity": mem.entity,
            "slot": mem.slot,
            "gold_value": mem.value,
            "gold_memory_id": mem.memory_id,
            "gold_text": mem.text,
            "topic": mem.topic,
        }
        queries.append(record)

    random.shuffle(queries)
    return queries


# Derive the question set from the memory bank; query_texts[i] is the
# question string of queries[i] (queries is already shuffled at this point).
queries = build_queries(memory_bank)
query_texts = [q["query"] for q in queries]
# NOTE(review): embed_texts is defined outside this excerpt; presumably it
# returns one embedding per input text in the same order -- confirm.
query_embeddings = embed_texts(query_texts)

Credit: Source link

ShareTweetSendSharePin

Related Posts

US Is Doubling Down on Tech Deals with the Gulf: Helberg
AI & Technology

US Is Doubling Down on Tech Deals with the Gulf: Helberg

April 28, 2026
Musk, Altman Feud Heads to Court Over Future of OpenAI
AI & Technology

Musk, Altman Feud Heads to Court Over Future of OpenAI

April 28, 2026
Big Job Cuts Come Ahead of Big Tech Earnings
AI & Technology

Big Job Cuts Come Ahead of Big Tech Earnings

April 27, 2026
OpenAI Drops Exclusivity Deal with Microsoft | Bloomberg Tech 4/27/2026
AI & Technology

OpenAI Drops Exclusivity Deal with Microsoft | Bloomberg Tech 4/27/2026

April 27, 2026
Next Post
Open source Xiaomi MiMo-V2.5 and V2.5-Pro are among the most efficient (and affordable) at agentic ‘claw’ tasks

Open source Xiaomi MiMo-V2.5 and V2.5-Pro are among the most efficient (and affordable) at agentic 'claw' tasks

Leave a Reply Cancel reply

Your email address will not be published. Required fields are marked *

Search

No Result
View All Result
Titanium Court mashes together genres and cultural references to tell a strange, funny tale

Titanium Court mashes together genres and cultural references to tell a strange, funny tale

April 23, 2026
Mend Releases AI Security Governance Framework: Covering Asset Inventory, Risk Tiering, AI Supply Chain Security, and Maturity Model

Mend Releases AI Security Governance Framework: Covering Asset Inventory, Risk Tiering, AI Supply Chain Security, and Maturity Model

April 24, 2026
Why people in Lebanon remain wary of ceasefire agreement with Israel

Why people in Lebanon remain wary of ceasefire agreement with Israel

April 21, 2026

About

Learn more

Our Services

Legal

Privacy Policy

Terms of Use

Bloggers

Learn more

Article Links

Contact

Advertise

Ask us anything

©2020- TradePoint.io - All rights reserved!

Tradepoint.io is solely a publishing and technology platform; it is not a registered broker-dealer or investment adviser and does not provide investment advice. Rather, brokerage services are provided to clients of Tradepoint.io by independent SEC-registered broker-dealers and members of FINRA/SIPC. Every form of investing carries some risk, and past performance is not a guarantee of future results. “Tradepoint.io”, “Instant Investing” and “My Trading Tools” are registered trademarks of Apperbuild, LLC.

This website is operated by Apperbuild, LLC. We have no link to any brokerage firm and we do not provide investment advice. All information and resources we provide are solely for the education of our readers. © 2020 Apperbuild, LLC. All rights reserved.

No Result
View All Result
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop

© 2023 - TradePoint.io - All Rights Reserved!