• bitcoinBitcoin(BTC)$77,115.00-2.56%
  • ethereumEthereum(ETH)$2,299.12-3.80%
  • tetherTether(USDT)$1.00-0.02%
  • rippleXRP(XRP)$1.40-3.04%
  • binancecoinBNB(BNB)$626.07-1.93%
  • usd-coinUSDC(USDC)$1.000.00%
  • solanaSolana(SOL)$84.41-3.70%
  • tronTRON(TRX)$0.3248210.39%
  • Figure HelocFigure Heloc(FIGR_HELOC)$1.031.24%
  • dogecoinDogecoin(DOGE)$0.099354-0.72%
  • whitebitWhiteBIT Coin(WBT)$54.53-2.66%
  • USDSUSDS(USDS)$1.00-0.07%
  • HyperliquidHyperliquid(HYPE)$41.45-3.32%
  • leo-tokenLEO Token(LEO)$10.370.02%
  • cardanoCardano(ADA)$0.248002-2.82%
  • bitcoin-cashBitcoin Cash(BCH)$449.11-1.69%
  • moneroMonero(XMR)$380.10-2.91%
  • chainlinkChainlink(LINK)$9.30-2.62%
  • zcashZcash(ZEC)$354.16-0.87%
  • CantonCanton(CC)$0.147868-2.11%
  • stellarStellar(XLM)$0.165514-4.08%
  • MemeCoreMemeCore(M)$3.74-13.03%
  • USD1USD1(USD1)$1.000.00%
  • daiDai(DAI)$1.00-0.02%
  • litecoinLitecoin(LTC)$55.47-2.01%
  • avalanche-2Avalanche(AVAX)$9.25-2.89%
  • hedera-hashgraphHedera(HBAR)$0.089508-3.64%
  • Ethena USDeEthena USDe(USDE)$1.00-0.01%
  • suiSui(SUI)$0.93-2.45%
  • shiba-inuShiba Inu(SHIB)$0.000006-2.19%
  • RainRain(RAIN)$0.007237-4.78%
  • paypal-usdPayPal USD(PYUSD)$1.000.00%
  • the-open-networkToncoin(TON)$1.31-0.68%
  • crypto-com-chainCronos(CRO)$0.069535-1.44%
  • Circle USYCCircle USYC(USYC)$1.120.00%
  • tether-goldTether Gold(XAUT)$4,667.80-0.41%
  • Global DollarGlobal Dollar(USDG)$1.000.00%
  • BittensorBittensor(TAO)$247.56-2.60%
  • World Liberty FinancialWorld Liberty Financial(WLFI)$0.072885-2.92%
  • BlackRock USD Institutional Digital Liquidity FundBlackRock USD Institutional Digital Liquidity Fund(BUIDL)$1.000.00%
  • pax-goldPAX Gold(PAXG)$4,666.00-0.48%
  • mantleMantle(MNT)$0.64-3.43%
  • polkadotPolkadot(DOT)$1.24-2.39%
  • SkySky(SKY)$0.0885700.70%
  • uniswapUniswap(UNI)$3.24-2.09%
  • Pi NetworkPi Network(PI)$0.1888184.69%
  • Falcon USDFalcon USD(USDF)$1.000.05%
  • okbOKB(OKB)$84.01-1.07%
  • nearNEAR Protocol(NEAR)$1.36-3.17%
  • HTX DAOHTX DAO(HTX)$0.0000020.84%
TradePoint.io
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop
No Result
View All Result
TradePoint.io
No Result
View All Result

Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering

April 27, 2026
in AI & Technology
Reading Time: 3 mins read
A A
Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering
ShareShareShareShareShare

YOU MAY ALSO LIKE

Xiaomi’s Electric Supercar Threatens Porsche, Europe Models

Why DeepSeek V4 Impresses Despite Lack of ‘Wow’ Factor

@dataclass
class MemoryItem:
   """One record in the synthetic long-term memory bank.

   Instances are created by ``build_memory_bank``. A record is either an
   answer-bearing fact about an entity, or a distractor/noise entry that is
   marked with ``slot == "distractor"`` and ``value == "n/a"``.
   """

   memory_id: int  # position of the record in the bank (assigned sequentially from 0)
   topic: str  # domain label of the entity, e.g. "robotics"; "noise" for generic filler
   entity: str  # entity the record is about, e.g. "Astra"; "none" for generic filler
   slot: str  # fact key such as "battery" or "release_year", or "distractor"
   value: str  # fact value such as "18 hours", or "n/a" for distractors
   text: str  # natural-language sentence that is stored (and later embedded)


def build_memory_bank() -> List[MemoryItem]:
    """Assemble the synthetic memory bank used for retrieval experiments.

    The bank is built in a fixed order:

    1. For every entity, each of its facts is rendered with every phrasing
       template (8 entities x 5 facts x 5 phrasings = 200 fact memories),
       immediately followed by that entity's 5 distractor sentences, which
       mention the entity but carry no fact (40 in total).
    2. Eight generic noise notes that mention no entity at all.

    Returns:
        The 248 ``MemoryItem`` records, with ``memory_id`` equal to each
        record's index in the returned list.
    """
    entity_specs = [
        {
            "entity": "Astra",
            "topic": "robotics",
            "facts": {
                "battery": "18 hours",
                "sensor": "LiDAR",
                "country": "Japan",
                "release_year": "2023",
                "specialty": "warehouse navigation",
            },
        },
        {
            "entity": "Orion",
            "topic": "astronomy",
            "facts": {
                "telescope": "infrared array",
                "country": "Chile",
                "discovery_year": "2019",
                "target": "exoplanet atmospheres",
                "aperture": "8 meters",
            },
        },
        {
            "entity": "Vita",
            "topic": "biomedicine",
            "facts": {
                "compound": "VX-17",
                "trial_phase": "Phase II",
                "country": "Canada",
                "target": "inflammatory markers",
                "delivery": "oral capsule",
            },
        },
        {
            "entity": "Nimbus",
            "topic": "climate",
            "facts": {
                "satellite": "polar orbiter",
                "country": "Norway",
                "launch_year": "2022",
                "instrument": "microwave radiometer",
                "mission": "sea ice monitoring",
            },
        },
        {
            "entity": "Atlas",
            "topic": "logistics",
            "facts": {
                "fleet_size": "240 trucks",
                "hub": "Muscat",
                "software": "predictive routing",
                "fuel_policy": "hybrid-first",
                "region": "GCC",
            },
        },
        {
            "entity": "Lumos",
            "topic": "materials",
            "facts": {
                "alloy": "Ti-6Al-4V",
                "process": "laser sintering",
                "density": "4.43 g/cm3",
                "country": "Germany",
                "use_case": "aerospace brackets",
            },
        },
        {
            "entity": "Cedar",
            "topic": "agriculture",
            "facts": {
                "crop": "wheat",
                "irrigation": "drip control",
                "country": "India",
                "yield_gain": "12 percent",
                "soil_sensor": "capacitive probe",
            },
        },
        {
            "entity": "Pulse",
            "topic": "healthcare",
            "facts": {
                "device": "ECG patch",
                "battery": "7 days",
                "country": "USA",
                "connectivity": "Bluetooth Low Energy",
                "use_case": "arrhythmia screening",
            },
        },
    ]

    # Five surface forms per fact, so the same (entity, slot, value) triple
    # is stored under several different wordings.
    fact_templates = [
        "{entity} in {topic} uses {value} for {slot}.",
        "The {slot} associated with {entity} is {value}.",
        "{entity} has {slot}: {value}.",
        "For {entity}, the recorded {slot} is {value}.",
        "Reference note: {entity} -> {slot} = {value}.",
    ]

    # Sentences that name the entity but state no fact about it.
    entity_distractor_templates = [
        "{entity} was discussed in a briefing about cross-domain innovation.",
        "{entity} has been compared with several other projects in recent reports.",
        "A summary note mentions {entity} among notable initiatives.",
        "{entity} appears in a high-level update without technical details.",
        "Stakeholders reviewed {entity} in a strategic planning session.",
    ]

    # Entity-free filler appended after all entity-specific records.
    generic_noise = [
        "General note: system maintenance occurred on Tuesday.",
        "A committee discussed budget timelines and operational readiness.",
        "The archive includes summaries of projects across multiple departments.",
        "No relevant technical value is stated in this memory.",
        "A status update mentioned partnerships and future opportunities.",
        "An unrelated note references shipping delays and staffing changes.",
        "Background memo: the team reviewed dashboards and reporting cadence.",
        "This memory contains no answer-bearing facts.",
    ]

    bank = []

    def remember(topic, entity, slot, value, text):
        # Records are only ever appended, so the current length of the bank
        # is always the next unused sequential id.
        bank.append(
            MemoryItem(
                memory_id=len(bank),
                topic=topic,
                entity=entity,
                slot=slot,
                value=value,
                text=text,
            )
        )

    for spec in entity_specs:
        name = spec["entity"]
        domain = spec["topic"]

        for slot, value in spec["facts"].items():
            for template in fact_templates:
                sentence = template.format(
                    entity=name, topic=domain, slot=slot, value=value
                )
                remember(domain, name, slot, value, sentence)

        for template in entity_distractor_templates:
            remember(domain, name, "distractor", "n/a", template.format(entity=name))

    for note in generic_noise:
        remember("noise", "none", "distractor", "n/a", note)

    return bank


# Build the memory bank once at module level; the statements below reuse it.
memory_bank = build_memory_bank()
# Plain-text view of the bank, in the same order as memory_bank.
memory_texts = [m.text for m in memory_bank]
# NOTE(review): embed_texts is defined outside this excerpt; presumably it
# returns one embedding per input text, in input order — confirm.
memory_embeddings = embed_texts(memory_texts)


def build_queries(memory_bank: List[MemoryItem]) -> List[Dict[str, Any]]:
    """Create one natural-language question per answer-bearing memory.

    Records whose ``slot`` is ``"distractor"`` are skipped. Every remaining
    record gets a question built from a randomly chosen template, with
    underscores in the slot name shown as spaces. The finished list is
    shuffled in place before it is returned.

    Randomness comes from the module-level ``random`` generator, so the
    result is only reproducible if that generator has been seeded.

    Args:
        memory_bank: Records to derive questions from.

    Returns:
        A shuffled list of dicts with the keys ``query_id``, ``query``,
        ``entity``, ``slot``, ``gold_value``, ``gold_memory_id``,
        ``gold_text`` and ``topic``. ``query_id`` numbers the questions in
        bank order, before shuffling.
    """
    question_templates = [
        "What is the {slot} of {entity}?",
        "Which {slot} does {entity} have?",
        "Tell me the {slot} for {entity}.",
        "Can you recall the {slot} associated with {entity}?",
        "What was recorded as the {slot} of {entity}?",
    ]

    answerable = [item for item in memory_bank if item.slot != "distractor"]

    # One random.choice call per answerable record, in bank order.
    queries = [
        {
            "query_id": query_id,
            "query": random.choice(question_templates).format(
                slot=item.slot.replace("_", " "),
                entity=item.entity,
            ),
            "entity": item.entity,
            "slot": item.slot,
            "gold_value": item.value,
            "gold_memory_id": item.memory_id,
            "gold_text": item.text,
            "topic": item.topic,
        }
        for query_id, item in enumerate(answerable)
    ]

    random.shuffle(queries)
    return queries


# Derive the question set from the memory bank (distractor records yield none).
queries = build_queries(memory_bank)
# Question strings only, in the same (shuffled) order as queries.
query_texts = [q["query"] for q in queries]
# NOTE(review): embed_texts is defined outside this excerpt; presumably it
# returns one embedding per input text, in input order — confirm.
query_embeddings = embed_texts(query_texts)

Credit: Source link

ShareTweetSendSharePin

Related Posts

Xiaomi’s Electric Supercar Threatens Porsche, Europe Models
AI & Technology

Xiaomi’s Electric Supercar Threatens Porsche, Europe Models

April 28, 2026
Why DeepSeek V4 Impresses Despite Lack of ‘Wow’ Factor
AI & Technology

Why DeepSeek V4 Impresses Despite Lack of ‘Wow’ Factor

April 28, 2026
Why Apple Picked Their Product Guy as the Next CEO
AI & Technology

Why Apple Picked Their Product Guy as the Next CEO

April 28, 2026
What Happens When AIs Work Together?
AI & Technology

What Happens When AIs Work Together?

April 28, 2026
Next Post
Open source Xiaomi MiMo-V2.5 and V2.5-Pro are among the most efficient (and affordable) at agentic ‘claw’ tasks

Open source Xiaomi MiMo-V2.5 and V2.5-Pro are among the most efficient (and affordable) at agentic 'claw' tasks

Leave a Reply Cancel reply

Your email address will not be published. Required fields are marked *

Search

No Result
View All Result
Steam Controller release date revealed as another review leaks online – Notebookcheck

Steam Controller release date revealed as another review leaks online – Notebookcheck

April 27, 2026
Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering

Build a Reinforcement Learning Powered Agent that Learns to Retrieve Relevant Long-Term Memories for Accurate LLM Question Answering

April 27, 2026
Cuban president says ‘if we need to die, we’ll die’ to prevent U.S. invasion: Full interview

Cuban president says ‘if we need to die, we’ll die’ to prevent U.S. invasion: Full interview

April 26, 2026

About

Learn more

Our Services

Legal

Privacy Policy

Terms of Use

Bloggers

Learn more

Article Links

Contact

Advertise

Ask us anything

©2020- TradePoint.io - All rights reserved!

Tradepoint.io, being just a publishing and technology platform, is not a registered broker-dealer or investment adviser, so we do not provide investment advice. Rather, brokerage services are provided to clients of Tradepoint.io by independent SEC-registered broker-dealers and members of FINRA/SIPC. Every form of investing carries some risk, and past performance is not a guarantee of future results. “Tradepoint.io”, “Instant Investing” and “My Trading Tools” are registered trademarks of Apperbuild, LLC.

This website is operated by Apperbuild, LLC. We have no link to any brokerage firm and we do not provide investment advice. All information and resources we provide are solely for the education of our readers. © 2020 Apperbuild, LLC. All rights reserved.

No Result
View All Result
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop

© 2023 - TradePoint.io - All Rights Reserved!