• bitcoinBitcoin(BTC)$75,769.00-2.12%
  • ethereumEthereum(ETH)$2,064.87-2.75%
  • tetherTether(USDT)$1.00-0.07%
  • binancecoinBNB(BNB)$654.81-1.08%
  • rippleXRP(XRP)$1.33-2.07%
  • usd-coinUSDC(USDC)$1.000.00%
  • solanaSolana(SOL)$83.38-2.78%
  • tronTRON(TRX)$0.3738590.33%
  • Figure HelocFigure Heloc(FIGR_HELOC)$1.031.75%
  • dogecoinDogecoin(DOGE)$0.100548-2.30%
  • HyperliquidHyperliquid(HYPE)$60.46-2.13%
  • USDSUSDS(USDS)$1.00-0.02%
  • zcashZcash(ZEC)$584.76-11.24%
  • leo-tokenLEO Token(LEO)$9.99-0.02%
  • cardanoCardano(ADA)$0.239015-2.71%
  • RainRain(RAIN)$0.01172447.14%
  • moneroMonero(XMR)$379.48-1.03%
  • bitcoin-cashBitcoin Cash(BCH)$344.09-1.73%
  • chainlinkChainlink(LINK)$9.35-2.12%
  • whitebitWhiteBIT Coin(WBT)$55.73-2.22%
  • CantonCanton(CC)$0.156548-5.06%
  • the-open-networkToncoin(TON)$1.99-1.45%
  • stellarStellar(XLM)$0.146916-2.43%
  • USD1USD1(USD1)$1.00-0.08%
  • Ethena USDeEthena USDe(USDE)$1.00-0.05%
  • daiDai(DAI)$1.00-0.01%
  • suiSui(SUI)$1.01-4.44%
  • litecoinLitecoin(LTC)$51.68-2.37%
  • avalanche-2Avalanche(AVAX)$9.13-2.72%
  • MemeCoreMemeCore(M)$2.90-0.82%
  • hedera-hashgraphHedera(HBAR)$0.086399-2.82%
  • paypal-usdPayPal USD(PYUSD)$1.000.00%
  • nearNEAR Protocol(NEAR)$2.62-4.42%
  • shiba-inuShiba Inu(SHIB)$0.000006-1.91%
  • crypto-com-chainCronos(CRO)$0.067143-3.08%
  • Circle USYCCircle USYC(USYC)$1.12-0.01%
  • Global DollarGlobal Dollar(USDG)$1.00-0.02%
  • BittensorBittensor(TAO)$279.70-0.97%
  • tether-goldTether Gold(XAUT)$4,488.51-1.31%
  • BlackRock USD Institutional Digital Liquidity FundBlackRock USD Institutional Digital Liquidity Fund(BUIDL)$1.000.00%
  • Ondo US Dollar YieldOndo US Dollar Yield(USDY)$1.130.46%
  • pax-goldPAX Gold(PAXG)$4,495.81-1.35%
  • mantleMantle(MNT)$0.64-2.64%
  • polkadotPolkadot(DOT)$1.24-2.95%
  • uniswapUniswap(UNI)$3.24-3.16%
  • OndoOndo(ONDO)$0.407343-6.48%
  • okbOKB(OKB)$89.667.41%
  • HTX DAOHTX DAO(HTX)$0.000002-0.09%
  • World Liberty FinancialWorld Liberty Financial(WLFI)$0.056873-7.85%
  • Ripple USDRipple USD(RLUSD)$1.00-0.01%
TradePoint.io
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop
No Result
View All Result
TradePoint.io
No Result
View All Result

Design a Complete Multimodal RLVR Pipeline with Open-MM-RL, Vision-Language Prompting, Reward Scoring, and GRPO Export

May 26, 2026
in AI & Technology
Reading Time: 2 mins read
A A
Design a Complete Multimodal RLVR Pipeline with Open-MM-RL, Vision-Language Prompting, Reward Scoring, and GRPO Export
ShareShareShareShareShare

YOU MAY ALSO LIKE

SpaceX Reportedly Pressured The Pentagon Into Paying More For Starlink Access

Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms

# Regexes tried in priority order when looking for the final answer in a
# model response; each one captures the answer text in group 1.
EXTRACT_PATS = [
    r"\\boxed\{([^{}]+)\}",
    r"final\s+answer\s*[:=]\s*([^\n]+)",
    r"answer\s*[:=]\s*([^\n]+)",
]

# Opening of a LaTeX boxed answer; matched case-insensitively, like EXTRACT_PATS.
_BOXED_OPEN = re.compile(r"\\boxed\{", re.IGNORECASE)


def _boxed_content(text):
    r"""Return the contents of the first balanced, non-empty ``\boxed{...}``.

    Unlike the ``[^{}]+`` regex in ``EXTRACT_PATS``, this walks the string and
    counts braces, so nested groups such as ``\boxed{\frac{1}{2}}`` are
    captured whole. Returns ``None`` when no balanced, non-empty box exists.
    """
    for opener in _BOXED_OPEN.finditer(text):
        start = opener.end()
        depth = 1
        for idx in range(start, len(text)):
            ch = text[idx]
            if ch == "{":
                depth += 1
            elif ch == "}":
                depth -= 1
                if depth == 0:
                    if idx > start:
                        return text[start:idx]
                    break  # empty box: try the next opener
    return None


def extract_final(text):
    r"""Pull the final answer out of a free-form response.

    Resolution order:
      1. the contents of a ``\boxed{...}`` (nested braces supported),
      2. the patterns in ``EXTRACT_PATS`` (first pattern that matches wins),
      3. the last non-blank line of the text.

    Args:
        text: the response; falsy values yield ``""``. Non-string values are
            converted with ``str`` before matching.

    Returns:
        The extracted answer, stripped of surrounding whitespace and of
        leading/trailing ``.``, ``,`` and ``;`` when it came from a pattern.
    """
    if not text:
        return ""
    # Coerce once so the regex searches and the line fallback see the same value.
    text = str(text)
    boxed = _boxed_content(text)
    if boxed is not None:
        return boxed.strip().strip(".,;")
    for pattern in EXTRACT_PATS:
        match = re.search(pattern, text, flags=re.IGNORECASE)
        if match:
            return match.group(1).strip().strip(".,;")
    lines = [line.strip() for line in text.strip().splitlines() if line.strip()]
    return lines[-1] if lines else ""
def latex_to_sympy(s):
    r"""Rewrite a small subset of LaTeX math into a plain expression string.

    The result is meant to be handed to ``float`` or a symbolic parser by the
    caller. Handled constructs:

    * surrounding ``$`` and a leading ``\[``/``\(`` or trailing ``\]``/``\)``
    * ``\pi``, ``\cdot``, ``\times`` and the spacing commands ``\,`` ``\;`` ``\!``
    * ``\frac{a}{b}`` (also ``\dfrac``/``\tfrac``) and ``\sqrt{a}``, including
      nested occurrences
    * ``^`` becomes ``**``; any other ``\command`` is dropped; remaining
      braces become parentheses

    Args:
        s: LaTeX source; ``None`` or an empty string yields ``""``.

    Returns:
        The rewritten expression string.
    """
    s = (s or "").strip().strip("$").strip()
    s = re.sub(r"^\\[\[\(]", "", s)
    s = re.sub(r"\\[\]\)]$", "", s)
    # "7396\pi" would otherwise become "7396pi", which has no multiplication
    # operator; make the product explicit when \pi follows a digit or a
    # closing bracket/brace.
    s = re.sub(r"(?<=[\d)}])\s*\\pi(?![a-zA-Z])", "*pi", s)
    s = (s.replace("\\pi", "pi").replace("\\cdot", "*").replace("\\times", "*")
          .replace("\\,", "").replace("\\;", "").replace("\\!", ""))
    # The patterns only match brace groups without inner braces, so nested
    # \frac / \sqrt are resolved innermost-first by repeating until stable.
    previous = None
    while previous != s:
        previous = s
        s = re.sub(r"\\[dt]?frac\s*\{([^{}]+)\}\s*\{([^{}]+)\}", r"((\1)/(\2))", s)
        s = re.sub(r"\\sqrt\s*\{([^{}]+)\}", r"sqrt(\1)", s)
    s = s.replace("^", "**")
    # Drop whatever LaTeX commands are left (e.g. \left, \right, \text).
    s = re.sub(r"\\[a-zA-Z]+", "", s)
    s = s.replace("{", "(").replace("}", ")")
    return s
def grade(pred, gold, tol=1e-4):
    """Score a prediction against a gold answer with a reward of 0.0, 0.5 or 1.0.

    Checks run from strictest to loosest and the first success wins:

    1. normalized string equality              -> 1.0
    2. numeric agreement within ``tol``         -> 1.0
    3. symbolic difference simplifies to zero   -> 1.0
    4. normalized gold is a substring of pred   -> 0.5

    Anything else, or a ``None`` argument, scores 0.0.

    Args:
        pred: raw response; the final answer is pulled out with ``extract_final``.
        gold: reference answer, compared as ``str(gold)``.
        tol: threshold for ``|pred - gold| / max(1, |gold|)``.

    Returns:
        The reward as a float.
    """
    if pred is None or gold is None:
        return 0.0

    def _canon(value):
        # Lower-case, drop all whitespace, then trim wrapping punctuation/brackets.
        return re.sub(r"\s+", "", value.lower()).strip("$.,;[]()")

    def _as_number(value):
        # Plain float parsing first; fall back to symbolic evaluation.
        try:
            return float(latex_to_sympy(value))
        except Exception:
            pass
        # NOTE(review): sympify is applied to text derived from `pred`; if that
        # text is untrusted model output, confirm this is acceptable.
        try:
            return float(sp.sympify(latex_to_sympy(value)).evalf())
        except Exception:
            return None

    answer = extract_final(str(pred)).strip()
    target = str(gold).strip()

    # 1. exact match after normalization
    if _canon(answer) == _canon(target):
        return 1.0

    # 2. numeric match using a relative error (absolute for |gold| < 1)
    answer_num = _as_number(answer)
    target_num = _as_number(target)
    if answer_num is not None and target_num is not None:
        rel_err = abs(answer_num - target_num) / max(1.0, abs(target_num))
        if rel_err < tol:
            return 1.0

    # 3. symbolic equivalence; any parse/simplify failure just skips this step
    try:
        answer_expr = sp.sympify(latex_to_sympy(answer))
        target_expr = sp.sympify(latex_to_sympy(target))
        if sp.simplify(answer_expr - target_expr) == 0:
            return 1.0
    except Exception:
        pass

    # 4. partial credit when the gold text appears inside the prediction
    target_key = _canon(target)
    if target_key and target_key in _canon(answer):
        return 0.5
    return 0.0
# Smoke-test table for grade(): (model output, gold answer, intended reward).
# The intended reward is only printed next to the actual one, not asserted.
_GRADER_CASES = [
    ("The answer is \\boxed{120}", "[120]", 1.0),
    ("After computing: 7396 \\pi", "7396\\pi", 1.0),
    ("Final answer: -71/4", "-\\frac{71}{4}", 1.0),
    ("Therefore the result is 0.0074", "0.0074", 1.0),
    ("Final answer: nucleus accumbens", "Nucleus accumbens", 1.0),
    ("I don't know", "12", 0.0),
]

print("\n=== Grader sanity checks ===")
for pred, gold, want in _GRADER_CASES:
    got = grade(pred, gold)
    print(f"  pred={pred[:38]!r:42s} gold={gold!r:22s} -> r={got}  (want {want})")
# Instruction header placed at the top of every prompt.
# NOTE(review): the text stops right after "Final answer: " — possibly an
# answer placeholder was lost when this snippet was copied; confirm.
SYSTEM = (
    "You are a STEM expert solving multimodal reasoning problems. "
    "You will see a question and one or more figures. "
    "Reason step by step, then end with exactly one line:\n"
    "Final answer: "
)


def build_prompt(ex):
    """Assemble the text prompt for one example.

    The prompt consists of the ``SYSTEM`` header, one ``[Image k]`` line per
    entry in ``ex["images"]`` (numbered from 1), the question, and a closing
    step-by-step cue, separated by blank lines.

    Args:
        ex: mapping with an ``"images"`` entry supporting ``len`` and a
            ``"question"`` entry.

    Returns:
        The prompt string.
    """
    image_count = len(ex["images"])
    placeholders = [f"[Image {number}]" for number in range(1, image_count + 1)]
    sections = (
        SYSTEM,
        "\n".join(placeholders),
        f"Question:\n{ex['question']}",
        "Let's think step by step.",
    )
    return "\n\n".join(sections)
# Show the first 600 characters of the prompt built from the first dataset row.
print("\n=== Example prompt (truncated) ===")
example_prompt = build_prompt(ds[0])
print(example_prompt[:600], "...\n")

Credit: Source link

ShareTweetSendSharePin

Related Posts

SpaceX Reportedly Pressured The Pentagon Into Paying More For Starlink Access
AI & Technology

SpaceX Reportedly Pressured The Pentagon Into Paying More For Starlink Access

May 26, 2026
Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms
AI & Technology

Spain Blocks Polymarket And Kalshi As It Investigates Prediction Market Platforms

May 26, 2026
Blue Origin Cleared To Launch New Glenn Rocket Again After FAA Investigation
AI & Technology

Blue Origin Cleared To Launch New Glenn Rocket Again After FAA Investigation

May 26, 2026
Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs
AI & Technology

Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

May 26, 2026
Next Post
Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

Meet OmniVoice Studio: A Local, Open-Source Alternative to ElevenLabs

Leave a Reply Cancel reply

Your email address will not be published. Required fields are marked *

Search

No Result
View All Result
My Friends Say I’ve Made a Big Financial Mistake

My Friends Say I’ve Made a Big Financial Mistake

May 20, 2026
5 judges who explain the courts’ rebuke of ICE detentions – Politico

5 judges who explain the courts’ rebuke of ICE detentions – Politico

May 24, 2026
Trump Mobile Has Exposed Customers’ Personal Data, Including Home Addresses And Phone Numbers

Trump Mobile Has Exposed Customers’ Personal Data, Including Home Addresses And Phone Numbers

May 22, 2026

About

Learn more

Our Services

Legal

Privacy Policy

Terms of Use

Bloggers

Learn more

Article Links

Contact

Advertise

Ask us anything

©2020- TradePoint.io - All rights reserved!

Tradepoint.io, being just a publishing and technology platform, is not a registered broker-dealer or investment adviser, so we do not provide investment advice. Rather, brokerage services are provided to clients of Tradepoint.io by independent SEC-registered broker-dealers and members of FINRA/SIPC. Every form of investing carries some risk and past performance is not a guarantee of future results. “Tradepoint.io”, “Instant Investing” and “My Trading Tools” are registered trademarks of Apperbuild, LLC.

This website is operated by Apperbuild, LLC. We have no link to any brokerage firm and we do not provide investment advice. All information and resources we provide are solely for the education of our readers. © 2020 Apperbuild, LLC. All rights reserved.

No Result
View All Result
  • Main
  • AI & Technology
  • Stock Charts
  • Market & News
  • Business
  • Finance Tips
  • Trade Tube
  • Blog
  • Shop

© 2023 - TradePoint.io - All Rights Reserved!