<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>Finance on serhii.net</title>
    <link>https://serhii.net/tags/finance/</link>
    <description>Recent content in Finance on serhii.net</description>
    <generator>Hugo</generator>
    <language>en-us</language>
    <copyright>Serhii Hamotskyi / serhii.net</copyright>
    <lastBuildDate>Sat, 16 May 2026 00:00:00 +0200</lastBuildDate>
    <atom:link href="https://serhii.net/tags/finance/index.xml" rel="self" type="application/rss+xml" />
    <item>
      <title>FNP-2026 at LREC paper notes</title>
      <link>https://serhii.net/dtb/260516-1107-fnp-2026-at-lrec-paper-notes/</link>
      <pubDate>Sat, 16 May 2026 00:00:00 +0200</pubDate>
      <guid>https://serhii.net/dtb/260516-1107-fnp-2026-at-lrec-paper-notes/</guid>
      <description>&lt;ul&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://wp.lancs.ac.uk/cfie/fnp2026/&#34;&gt;FNP – FNP 2026&lt;/a&gt;&lt;/li&gt;&#xA;&lt;li&gt;FNP 2026 &lt;a href=&#34;http://lrec-conf.org/proceedings/lrec2026/workshops/fnp/2026.fnp-1.0.pdf&#34;&gt;proceedings&lt;/a&gt; PDF.&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;h3 id=&#34;when-tables-go-crazy-evaluating-multimodal-models-on-french-financial-documents&#34;&gt;When Tables Go Crazy: Evaluating Multimodal Models on French Financial Documents&lt;/h3&gt;&#xA;&lt;ul&gt;&#xA;&lt;li&gt;Links&#xA;&lt;ul&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://arxiv.org/abs/2602.10384&#34;&gt;[2602.10384] When Tables Go Crazy: Evaluating Multimodal Models on French Financial Documents&lt;/a&gt;&lt;/li&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://github.com/dseddah/Scribe_finance&#34;&gt;Github&lt;/a&gt; contains both dataset and scripts!&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;li&gt;Benchmark French visual finance docs, includes evaluation on multiple VLMs&#xA;&lt;ul&gt;&#xA;&lt;li&gt;Chart checkboxes graphs and weird edge cases specifically present&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;li&gt;Bits&#xA;&lt;ul&gt;&#xA;&lt;li&gt;LLMs when asked to generate questions usually generate only questions they have answers to&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;h3 id=&#34;cfqa-a-chinese-financial-question-answering-benchmark-from-corporate-annual-reports&#34;&gt;CFQA: A Chinese Financial Question Answering Benchmark from Corporate Annual Reports&lt;/h3&gt;&#xA;&lt;ul&gt;&#xA;&lt;li&gt;Links:&#xA;&lt;ul&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://huggingface.co/datasets/ZackZhu00/CFQA_Chinese_Finance_Question_Answering&#34;&gt;ZackZhu00/CFQA_Chinese_Finance_Question_Answering · Datasets at Hugging Face&lt;/a&gt;&lt;/li&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://github.com/zhutianning/Hallucination-detection-for-RAG&#34;&gt;zhutianning/Hallucination-detection-for-RAG: This project aims to design and implement a hallucination detection and evaluation pipeline for Retrieval- Augmented Generation (RAG) systems processing multi-modal financial reports (text, tables, images/charts).&lt;/a&gt;&lt;/li&gt;&#xA;&lt;li&gt;Unclear relation:&#xA;&lt;ul&gt;&#xA;&lt;li&gt;&lt;a href=&#34;https://github.com/ygan/CFQA&#34;&gt;Github&lt;/a&gt; (?) / &lt;a href=&#34;https://link.springer.com/article/10.1140/epjds/s13688-025-00601-6#Sec17&#34;&gt;Addressing investor concerns: a Chinese financial question-answering benchmark with LLM-based evaluation | EPJ Data Science | Springer Nature Link&lt;/a&gt; (??)&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;li&gt;Takeaway&#xA;&lt;ul&gt;&#xA;&lt;li&gt;RAG decreases hallucinations and improves fact extraction scores but not clear for other tasks involving reasoning, and decrease scores w/ some model[s&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;h3 id=&#34;-verifiable-financial-enterprise-question-answering-via-inference-time-grounding-and-traceability&#34;&gt;(!) Verifiable Financial Enterprise Question Answering via Inference-Time Grounding and Traceability&lt;/h3&gt;&#xA;&lt;ul&gt;&#xA;&lt;li&gt;LLMs grounding verifiable citations&lt;/li&gt;&#xA;&lt;li&gt;Framework, modular, real-time&lt;/li&gt;&#xA;&lt;li&gt;Verify citations and fix citation drift by looking at ovelaps/presence w/ source documents.&#xA;&lt;ul&gt;&#xA;&lt;li&gt;&lt;strong&gt;Sentence-level citations&lt;/strong&gt; allegedly lead to better groundedness&lt;/li&gt;&#xA;&lt;/ul&gt;&#xA;&lt;/li&gt;&#xA;&lt;li&gt;&lt;strong&gt;TODO&lt;/strong&gt; Many many interesting citations to parse&#xA;&#xA;  &lt;img src=&#34;https://serhii.net/assets/pasted-image-20260516114801.png&#34; alt=&#34;Pasted image 20260516114801.png&#34;&gt;&#xA;&#xA;&lt;/li&gt;&#xA;&lt;li&gt;Related paper I just found: &lt;a href=&#34;https://arxiv.org/abs/2604.23588&#34;&gt;[2604.23588] FinGround: Detecting and Grounding Financial Hallucinations via Atomic Claim Verification&lt;/a&gt;&lt;/li&gt;&#xA;&lt;/ul&gt;</description>
    </item>
  </channel>
</rss>
