• bitcoinBitcoin(BTC)$75,987.00-2.01%
  • ethereumEthereum(ETH)$2,072.81-2.62%
  • tetherTether(USDT)$1.00-0.06%
  • binancecoinBNB(BNB)$655.63-0.88%
  • rippleXRP(XRP)$1.33-1.91%
  • usd-coinUSDC(USDC)$1.00-0.01%
  • solanaSolana(SOL)$83.78-2.70%
  • tronTRON(TRX)$0.3740630.44%
  • Figure HelocFigure Heloc(FIGR_HELOC)$1.031.81%
  • dogecoinDogecoin(DOGE)$0.101137-1.99%
  • HyperliquidHyperliquid(HYPE)$61.56-1.02%
  • USDSUSDS(USDS)$1.00-0.06%
  • zcashZcash(ZEC)$595.14-10.85%
  • leo-tokenLEO Token(LEO)$9.97-0.16%
  • cardanoCardano(ADA)$0.240692-2.51%
  • moneroMonero(XMR)$379.96-2.00%
  • RainRain(RAIN)$0.01119340.05%
  • bitcoin-cashBitcoin Cash(BCH)$346.03-1.18%
  • chainlinkChainlink(LINK)$9.42-1.85%
  • whitebitWhiteBIT Coin(WBT)$55.91-2.15%
  • CantonCanton(CC)$0.156363-6.20%
  • the-open-networkToncoin(TON)$1.95-4.92%
  • stellarStellar(XLM)$0.147769-2.10%
  • USD1USD1(USD1)$1.00-0.09%
  • Ethena USDeEthena USDe(USDE)$1.00-0.03%
  • daiDai(DAI)$1.000.01%
  • suiSui(SUI)$1.01-4.26%
  • litecoinLitecoin(LTC)$51.95-1.92%
  • avalanche-2Avalanche(AVAX)$9.19-2.53%
  • MemeCoreMemeCore(M)$2.88-1.61%
  • hedera-hashgraphHedera(HBAR)$0.086963-2.12%
  • paypal-usdPayPal USD(PYUSD)$1.00-0.03%
  • nearNEAR Protocol(NEAR)$2.64-3.29%
  • shiba-inuShiba Inu(SHIB)$0.000006-1.95%
  • crypto-com-chainCronos(CRO)$0.067666-2.72%
  • Circle USYCCircle USYC(USYC)$1.12-0.01%
  • Global DollarGlobal Dollar(USDG)$1.00-0.01%
  • BittensorBittensor(TAO)$283.931.46%
  • tether-goldTether Gold(XAUT)$4,481.17-1.48%
  • BlackRock USD Institutional Digital Liquidity FundBlackRock USD Institutional Digital Liquidity Fund(BUIDL)$1.000.00%
  • Ondo US Dollar YieldOndo US Dollar Yield(USDY)$1.13-0.11%
  • polkadotPolkadot(DOT)$1.26-2.42%
  • pax-goldPAX Gold(PAXG)$4,488.77-1.52%
  • mantleMantle(MNT)$0.64-2.82%
  • uniswapUniswap(UNI)$3.25-3.21%
  • OndoOndo(ONDO)$0.412977-6.20%
  • okbOKB(OKB)$89.417.18%
  • HTX DAOHTX DAO(HTX)$0.0000020.57%
  • Ripple USDRipple USD(RLUSD)$1.000.00%
  • AsterAster(ASTER)$0.68-2.54%
TradePoint.io
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop
No Result
View All Result
TradePoint.io
No Result
View All Result

Design a Complete Multimodal RLVR Pipeline with Open-MM-RL, Vision-Language Prompting, Reward Scoring, and GRPO Export

May 26, 2026
in AI & Technology
Reading Time: 2 mins read
A A
Design a Complete Multimodal RLVR Pipeline with Open-MM-RL, Vision-Language Prompting, Reward Scoring, and GRPO Export
ShareShareShareShareShare

YOU MAY ALSO LIKE

Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms

Blue Origin Cleared To Launch New Glenn Rocket Again After FAA Investigation

# Regexes tried in priority order by extract_final(); each captures the answer
# text in group 1. Matching is case-insensitive.
EXTRACT_PATS = [
    r"\\boxed\{([^{}]+)\}",
    r"final\s+answer\s*[:=]\s*([^\n]+)",
    r"answer\s*[:=]\s*([^\n]+)",
]


def _extract_boxed(text):
    r"""Return the contents of the first brace-balanced ``\boxed{...}`` in *text*.

    Unlike the flat regex in ``EXTRACT_PATS``, this walks the string and counts
    brace depth, so nested groups such as ``\boxed{\frac{1}{2}}`` are captured
    whole. Returns ``None`` when no non-empty, balanced box is found.
    """
    for opener in re.finditer(r"\\boxed\{", text, flags=re.IGNORECASE):
        start = opener.end()
        depth = 1
        for pos in range(start, len(text)):
            ch = text[pos]
            if ch == "{":
                depth += 1
            elif ch == "}":
                depth -= 1
                if depth == 0:
                    inner = text[start:pos]
                    if inner:
                        return inner
                    # Empty box: give up on this opener, try the next one.
                    break
    return None


def extract_final(text):
    r"""Pull the final answer string out of a free-form model response.

    Resolution order:
      1. the contents of a ``\boxed{...}`` (nested braces allowed),
      2. the text after ``final answer:`` / ``answer:`` (``:`` or ``=``),
      3. the last non-blank line of the response.

    Answers found by (1) or (2) are stripped of surrounding whitespace and of
    leading/trailing ``.,;``. Falsy input returns ``""``; any other non-string
    input is converted with ``str()`` first.
    """
    if not text:
        return ""
    text = str(text)

    boxed = _extract_boxed(text)
    if boxed is not None:
        return boxed.strip().strip(".,;")

    for pattern in EXTRACT_PATS:
        m = re.search(pattern, text, flags=re.IGNORECASE)
        if m:
            return m.group(1).strip().strip(".,;")

    # No explicit marker: fall back to the last non-blank line.
    lines = [ln.strip() for ln in text.strip().splitlines() if ln.strip()]
    return lines[-1] if lines else ""
def latex_to_sympy(s):
    r"""Rewrite a small subset of LaTeX math into a plain expression string.

    The result is meant to be handed to a parser such as ``sympify``; this
    function itself only does text substitution. Handled constructs:

    * surrounding ``$``, ``\(`` / ``\[`` and ``\)`` / ``\]`` delimiters,
    * ``\pi``, ``\cdot``, ``\times`` and the spacing commands ``\,`` ``\;`` ``\!``,
    * ``\frac{a}{b}`` (also ``\dfrac`` / ``\tfrac``) -> ``((a)/(b))``,
    * ``\sqrt{a}`` -> ``sqrt(a)``,
    * ``^`` -> ``**``; remaining ``\command`` names are dropped and braces
      become parentheses.

    ``None`` or other falsy input yields ``""``.
    """
    s = str(s or "").strip().strip("$").strip()
    s = re.sub(r"^\\[\[\(]", "", s)
    s = re.sub(r"\\[\]\)]$", "", s)

    # "7396\pi" means 7396*pi; without an explicit operator the result
    # ("7396pi") is not a valid expression.
    s = re.sub(r"(?<=[0-9)])\s*\\pi", "*pi", s)
    for latex, plain in (
        ("\\pi", "pi"),
        ("\\cdot", "*"),
        ("\\times", "*"),
        ("\\,", ""),
        ("\\;", ""),
        ("\\!", ""),
    ):
        s = s.replace(latex, plain)

    # Both patterns only match brace-free arguments, so rewrite innermost
    # groups first and repeat until stable. This resolves nesting such as
    # \frac{\sqrt{2}}{2} or \frac{\frac{1}{2}}{3}.
    previous = None
    while previous != s:
        previous = s
        s = re.sub(r"\\sqrt\s*\{([^{}]+)\}", r"sqrt(\1)", s)
        s = re.sub(
            r"\\[dt]?frac\s*\{([^{}]+)\}\s*\{([^{}]+)\}", r"((\1)/(\2))", s
        )

    s = s.replace("^", "**")
    # Drop any remaining LaTeX command names (e.g. \left, \right).
    s = re.sub(r"\\[a-zA-Z]+", "", s)
    return s.replace("{", "(").replace("}", ")")
def grade(pred, gold, tol=1e-4):
    """Verifiable reward in [0,1]: exact > numeric > sympy-symbolic > partial.

    Args:
        pred: Raw model response; the final answer is pulled out with
            ``extract_final`` after ``str()`` conversion.
        gold: Reference answer; compared as ``str(gold)``.
        tol: Tolerance for the numeric check, applied to
            ``|pred - gold| / max(1, |gold|)``.

    Returns:
        ``1.0`` if the answers match after normalisation, numerically within
        ``tol``, or symbolically (``simplify(pred - gold) == 0``);
        ``0.5`` if the normalised gold string occurs inside the normalised
        prediction; otherwise ``0.0``. ``None`` for either argument gives
        ``0.0``.

    SECURITY: ``sp.sympify`` evaluates its string argument with ``eval``.
    ``pred`` is model output, i.e. untrusted; run this grader in a sandboxed
    process if the responses cannot be trusted.
    """
    if pred is None or gold is None:
        return 0.0
    p = extract_final(str(pred)).strip()
    g = str(gold).strip()

    def norm(x):
        # Case-fold, drop all whitespace, trim wrapping punctuation/brackets.
        return re.sub(r"\s+", "", x.lower()).strip("$.,;[]()")

    norm_p, norm_g = norm(p), norm(g)
    if norm_p == norm_g:
        return 1.0

    # Each side is parsed at most once and reused by both the numeric and
    # symbolic stages; None records a failed parse.
    parsed = {}

    def to_expr(x):
        if x not in parsed:
            try:
                parsed[x] = sp.sympify(latex_to_sympy(x))
            except Exception:
                parsed[x] = None
        return parsed[x]

    def to_float(x):
        try:
            return float(latex_to_sympy(x))
        except Exception:
            expr = to_expr(x)
            if expr is None:
                return None
            try:
                return float(expr.evalf())
            except Exception:
                return None

    # Numeric match within tolerance.
    fp, fg = to_float(p), to_float(g)
    if fp is not None and fg is not None:
        if abs(fp - fg) / max(1.0, abs(fg)) < tol:
            return 1.0

    # Symbolic equivalence; best effort, any failure falls through.
    ep, eg = to_expr(p), to_expr(g)
    if ep is not None and eg is not None:
        try:
            if sp.simplify(ep - eg) == 0:
                return 1.0
        except Exception:
            pass

    # Partial credit: the gold answer appears somewhere in the prediction.
    if norm_g and norm_g in norm_p:
        return 0.5
    return 0.0
# Smoke-test the grader: for each (prediction, gold, expected reward) triple,
# print the reward grade() returns next to the expected value so the two can
# be compared by eye. Nothing is asserted here.
print("\n=== Grader sanity checks ===")
_SANITY_CASES = [
    ("The answer is \\boxed{120}", "[120]", 1.0),
    ("After computing: 7396 \\pi", "7396\\pi", 1.0),
    ("Final answer: -71/4", "-\\frac{71}{4}", 1.0),
    ("Therefore the result is 0.0074", "0.0074", 1.0),
    ("Final answer: nucleus accumbens", "Nucleus accumbens", 1.0),
    ("I don't know", "12", 0.0),
]
for pred, gold, want in _SANITY_CASES:
    reward = grade(pred, gold)
    # Prediction is truncated to 38 characters to keep the columns aligned.
    print(f"  pred={pred[:38]!r:42s} gold={gold!r:22s} -> r={reward}  (want {want})")
# Instruction header placed at the top of every prompt.
# NOTE(review): the template stops right after "Final answer: " -- it may have
# lost a trailing placeholder (e.g. an answer tag) upstream; confirm.
SYSTEM = (
    "You are a STEM expert solving multimodal reasoning problems. "
    "You will see a question and one or more figures. "
    "Reason step by step, then end with exactly one line:\n"
    "Final answer: "
)


def build_prompt(ex):
    """Build the text prompt for one example.

    Args:
        ex: Mapping with a ``"question"`` entry and, optionally, an
            ``"images"`` sequence. Only the number of images is used: one
            ``[Image k]`` placeholder line (1-based) is emitted per image.
            A missing or ``None`` ``"images"`` entry is treated as no images.

    Returns:
        ``SYSTEM``, the image placeholders, the question, and a
        "Let's think step by step." cue, separated by blank lines.
    """
    try:
        images = ex["images"]
    except KeyError:
        images = None
    n_images = 0 if images is None else len(images)
    img_tags = "\n".join(f"[Image {k}]" for k in range(1, n_images + 1))
    return f"{SYSTEM}\n\n{img_tags}\n\nQuestion:\n{ex['question']}\n\nLet's think step by step."
# Preview the prompt built for the first example, cut to 600 characters.
# `ds` is defined outside this section -- presumably the loaded dataset; confirm.
print("\n=== Example prompt (truncated) ===")
_first_prompt = build_prompt(ds[0])
print(_first_prompt[:600], "...\n")

Credit: Source link

ShareTweetSendSharePin

Related Posts

Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms
AI & Technology

Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms

May 26, 2026
Blue Origin Cleared To Launch New Glenn Rocket Again After FAA Investigation
AI & Technology

Blue Origin Cleared To Launch New Glenn Rocket Again After FAA Investigation

May 26, 2026
Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs
AI & Technology

Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

May 26, 2026
Sennheiser’s Momentum 5 Headphones Are All About The Audio And ANC Upgrades
AI & Technology

Sennheiser’s Momentum 5 Headphones Are All About The Audio And ANC Upgrades

May 25, 2026
Next Post
Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

Leave a Reply Cancel reply

Your email address will not be published. Required fields are marked *

Search

No Result
View All Result
What Comes Next After SpaceX Halts Starship Launch

What Comes Next After SpaceX Halts Starship Launch

May 24, 2026
Google co-founder throws $500K at anti ‘Overpaid CEO Tax’ campaign

Google co-founder throws $500K at anti ‘Overpaid CEO Tax’ campaign

May 20, 2026
100% ROI OSCR Full Analysis | Buy, Sell, or Short This Stock?

100% ROI OSCR Full Analysis | Buy, Sell, or Short This Stock?

May 22, 2026

About

Learn more

Our Services

Legal

Privacy Policy

Terms of Use

Bloggers

Learn more

Article Links

Contact

Advertise

Ask us anything

©2020- TradePoint.io - All rights reserved!

Tradepoint.io, being just a publishing and technology platform, is not a registered broker-dealer or investment adviser. So we do not provide investment advice. Rather, brokerage services are provided to clients of Tradepoint.io by independent SEC-registered broker-dealers and members of FINRA/SIPC. Every form of investing carries some risk and past performance is not a guarantee of future results. “Tradepoint.io”, “Instant Investing” and “My Trading Tools” are registered trademarks of Apperbuild, LLC.

This website is operated by Apperbuild, LLC. We have no link to any brokerage firm and we do not provide investment advice. All information and resources we provide are solely for the education of our readers. © 2020 Apperbuild, LLC. All rights reserved.

No Result
View All Result
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop

© 2023 - TradePoint.io - All Rights Reserved!