For a complete understanding of Extract outputs, see Extract Outputs.
For configuration options, see Extract Overview.
Financial Report
Extract key financial metrics and data from financial statements, earnings reports, and other financial documents.
Schema
Copy
Ask AI
import os
from typing import List, Optional
from chunkr_ai import Chunkr
from pydantic import BaseModel, Field
class FinancialPositionItem(BaseModel):
    # One line item of a statement of financial position.
    # Documented with comments rather than a docstring: Pydantic copies a
    # class docstring into the generated JSON schema's "description".
    category: str  # sample output uses "Assets", "Liabilities", "Equity"
    # Nullable, but declared without a default, so the key itself is still
    # required under Pydantic v2. Sample values: "Current assets",
    # "Non-current liabilities".
    subcategory: Optional[str]
    account_name: str  # e.g. "Cash and cash equivalents"
    amount: float  # figure as printed (the sample report is in millions of yen)
class FinancialPositionPeriod(BaseModel):
    # All financial-position line items reported for a single snapshot date.
    as_of_date: str = Field(description="Date for this financial position snapshot")
    items: List[FinancialPositionItem]
class StatementOfFinancialPosition(BaseModel):
    # Statement of financial position: one entry in `periods` per snapshot
    # date (the sample output carries 2024-03-31 and 2025-03-31).
    currency: str  # e.g. "JPY" in the sample output
    periods: List[FinancialPositionPeriod]
class ProfitOrLossItem(BaseModel):
    # One line of the statement of profit or loss.
    account_name: str = Field(description="Name of the profit and loss account")
    # Signed figure as extracted; in the sample output costs come back
    # negative (e.g. "Cost of sales": -3489549).
    amount: float
class StatementOfProfitAndLoss(BaseModel):
    # Statement of profit or loss for one reporting period.
    period_start: str  # sample output uses ISO dates, e.g. "2024-04-01"
    period_end: str  # e.g. "2025-03-31"
    currency: str
    items: List[ProfitOrLossItem] = Field(description="List of profit and loss items")
    net_income: float = Field(description="Total net income for this period")
class ComprehensiveIncomeItem(BaseModel):
    # One line of the statement of comprehensive income.
    account_name: str = Field(description="Name of the comprehensive income account")
    amount: float = Field(description="Monetary value in the statement's base currency")
class ComprehensiveIncomePeriod(BaseModel):
    # Comprehensive-income line items and their total for one period.
    period_end: str = Field(description="Ending date for this period (YYYY-MM-DD)")
    items: List[ComprehensiveIncomeItem]
    total_comprehensive_income: float
class StatementOfComprehensiveIncome(BaseModel):
    # Statement of comprehensive income: one entry in `periods` per period.
    currency: str
    periods: List[ComprehensiveIncomePeriod]
class EquityChangeItem(BaseModel):
    # Opening and closing balance of one equity component, plus labels for
    # what moved it during the period.
    component: str = Field(description="Name of the equity component")
    opening_balance: float = Field(description="Balance at the beginning of the period")
    # Textual descriptions only (no amounts); the sample output returns an
    # empty list for components that did not change.
    changes: List[str] = Field(description="Descriptions of changes during the period")
    closing_balance: float = Field(description="Balance at the end of the period")
class StatementOfChangesInEquity(BaseModel):
    # Statement of changes in equity for a single period; unlike the other
    # statements it has no `periods` list, only one `period_end`.
    period_end: str
    currency: str
    items: List[EquityChangeItem]
class CashFlowItem(BaseModel):
    # One line of the statement of cash flows.
    # Free-form string; the sample output uses "Operating Activities",
    # "Investing Activities", "Financing Activities" and "Other".
    activity_type: str = Field(description="Type of cash flow activity")
    account_name: str = Field(description="Name of the cash flow account")
    amount: float  # signed; outflows are negative in the sample output
class CashFlowPeriod(BaseModel):
    # Cash-flow line items and summary figures for one period.
    period_end: str
    items: List[CashFlowItem] = Field(description="List of cash flow items")
    # May be negative: the sample output reports -2473846 (a net decrease).
    net_increase_in_cash: float = Field(description="Net increase for this period")
    closing_cash_balance: float = Field(description="Balance at the end of this period")
class StatementOfCashFlows(BaseModel):
    # Statement of cash flows: one entry in `periods` per reporting period.
    currency: str
    periods: List[CashFlowPeriod] = Field(description="List of cash flow periods")
class FinancialReport(BaseModel):
    # Root extraction schema: report-level metadata plus one optional
    # sub-model per financial statement.
    # Documented with comments rather than a docstring: Pydantic copies a
    # class docstring into the generated JSON schema's "description", which
    # would change the schema passed to the extract task.
    entity_name: str = Field(description="Name of the reporting entity")

    # Every Optional[...] field below is nullable but has no default, so under
    # Pydantic v2 the key is still listed as required in the JSON schema.
    report_title: Optional[str]
    reporting_period_start: Optional[str]  # sample output: "2024-04-01"
    reporting_period_end: Optional[str]  # sample output: "2025-03-31"
    reporting_as_of_date: Optional[str]
    currency: str  # report-level currency; each statement repeats its own

    statement_of_financial_position: Optional[StatementOfFinancialPosition]
    statement_of_profit_or_loss: Optional[StatementOfProfitAndLoss]
    statement_of_comprehensive_income: Optional[StatementOfComprehensiveIncome]
    statement_of_changes_in_equity: Optional[StatementOfChangesInEquity]
    statement_of_cash_flows: Optional[StatementOfCashFlows]
Process
Copy
Ask AI
# Derive the JSON schema the extractor should fill in from the Pydantic model
schema = FinancialReport.model_json_schema()

# Build the API client; a missing CHUNKR_API_KEY raises KeyError here
client = Chunkr(api_key=os.environ["CHUNKR_API_KEY"])

# Submit the extract task for the sample financial report
report_url = "https://s3.us-east-1.amazonaws.com/chunkr-web/uploads/financial_report.pdf"
task = client.tasks.extract.create(schema=schema, file=report_url)
Output
Copy
Ask AI
{
"currency": "JPY",
"entity_name": "SoftBank Group Corp.",
"report_title": "Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"reporting_as_of_date": "2025-03-31",
"reporting_period_end": "2025-03-31",
"reporting_period_start": "2024-04-01",
"statement_of_cash_flows": {
"currency": "JPY",
"periods": [
{
"closing_cash_balance": 3713028,
"items": [
{
"account_name": "Net income",
"activity_type": "Operating Activities",
"amount": 1603108
},
{
"account_name": "Depreciation and amortization",
"activity_type": "Operating Activities",
"amount": 866823
},
{
"account_name": "Loss (gain) on investments at Investment Business of Holding Companies",
"activity_type": "Operating Activities",
"amount": -3422188
},
{
"account_name": "Loss (gain) on investments at SoftBank Vision Funds",
"activity_type": "Operating Activities",
"amount": -387584
},
{
"account_name": "Finance cost",
"activity_type": "Operating Activities",
"amount": 581559
},
{
"account_name": "Foreign exchange loss (gain)",
"activity_type": "Operating Activities",
"amount": -27055
},
{
"account_name": "Derivative (gain) loss (excluding (gain) loss on investments)",
"activity_type": "Operating Activities",
"amount": 2034029
},
{
"account_name": "Change in third-party interests in SVF",
"activity_type": "Operating Activities",
"amount": 491898
},
{
"account_name": "(Gain) loss on other investments and other gain",
"activity_type": "Operating Activities",
"amount": -253953
},
{
"account_name": "Income taxes",
"activity_type": "Operating Activities",
"amount": 101613
},
{
"account_name": "Increase in investments from asset management subsidiaries",
"activity_type": "Operating Activities",
"amount": -769572
},
{
"account_name": "Increase in trade and other receivables",
"activity_type": "Operating Activities",
"amount": -508544
},
{
"account_name": "Decrease (increase) in inventories",
"activity_type": "Operating Activities",
"amount": -40000
},
{
"account_name": "Increase in trade and other payables",
"activity_type": "Operating Activities",
"amount": 237030
},
{
"account_name": "Other",
"activity_type": "Operating Activities",
"amount": 93974
},
{
"account_name": "Interest and dividends received",
"activity_type": "Operating Activities",
"amount": 299714
},
{
"account_name": "Interest paid",
"activity_type": "Operating Activities",
"amount": -482111
},
{
"account_name": "Income taxes paid",
"activity_type": "Operating Activities",
"amount": -380008
},
{
"account_name": "Income taxes refunded",
"activity_type": "Operating Activities",
"amount": 164847
},
{
"account_name": "Payments for acquisition of investments",
"activity_type": "Investing Activities",
"amount": -1625245
},
{
"account_name": "Proceeds from sales/redemption of investments",
"activity_type": "Investing Activities",
"amount": 1180746
},
{
"account_name": "Payments for acquisition of investments by SVF",
"activity_type": "Investing Activities",
"amount": -578927
},
{
"account_name": "Proceeds from sales of investments by SVF",
"activity_type": "Investing Activities",
"amount": 458319
},
{
"account_name": "Payments (net) for acquisition of control over subsidiaries",
"activity_type": "Investing Activities",
"amount": -194216
},
{
"account_name": "Proceeds (net) from loss of control over subsidiaries",
"activity_type": "Investing Activities",
"amount": 94862
},
{
"account_name": "Purchase of property, plant and equipment, and intangible assets",
"activity_type": "Investing Activities",
"amount": -854173
},
{
"account_name": "Payments for loan receivables",
"activity_type": "Investing Activities",
"amount": -36538
},
{
"account_name": "Collection of loan receivables",
"activity_type": "Investing Activities",
"amount": 119384
},
{
"account_name": "Payments into time deposits",
"activity_type": "Investing Activities",
"amount": -139211
},
{
"account_name": "Proceeds from withdrawal of time deposits",
"activity_type": "Investing Activities",
"amount": 166897
},
{
"account_name": "Other",
"activity_type": "Investing Activities",
"amount": -223438
},
{
"account_name": "Proceeds in (repayment of) short-term interest-bearing debt, net",
"activity_type": "Financing Activities",
"amount": -421723
},
{
"account_name": "Proceeds from interest-bearing debt",
"activity_type": "Financing Activities",
"amount": 5313665
},
{
"account_name": "Repayment of interest-bearing debt",
"activity_type": "Financing Activities",
"amount": -3809082
},
{
"account_name": "Repayment of lease liabilities",
"activity_type": "Financing Activities",
"amount": -186441
},
{
"account_name": "Distribution/repayment from SVF to third-party investors",
"activity_type": "Financing Activities",
"amount": -1485774
},
{
"account_name": "Purchase of shares of subsidiaries from non-controlling interests",
"activity_type": "Financing Activities",
"amount": -79581
},
{
"account_name": "Distribution to owners of other equity instruments",
"activity_type": "Financing Activities",
"amount": -18867
},
{
"account_name": "Proceeds from the issuance of other equity instruments in subsidiaries",
"activity_type": "Financing Activities",
"amount": 200000
},
{
"account_name": "Purchase of treasury stock",
"activity_type": "Financing Activities",
"amount": -237058
},
{
"account_name": "Cash dividends paid",
"activity_type": "Financing Activities",
"amount": -64020
},
{
"account_name": "Cash dividends paid to non-controlling interests",
"activity_type": "Financing Activities",
"amount": -368678
},
{
"account_name": "Other",
"activity_type": "Financing Activities",
"amount": 41175
},
{
"account_name": "Effect of exchange rate changes on cash and cash equivalents",
"activity_type": "Other",
"amount": 37487
},
{
"account_name": "(Decrease) increase in cash and cash equivalents relating to transfer of assets classified as held for sale",
"activity_type": "Other",
"amount": 33011
}
],
"net_increase_in_cash": -2473846,
"period_end": "2025-03-31"
}
]
},
"statement_of_changes_in_equity": {
"currency": "JPY",
"items": [
{
"changes": [],
"closing_balance": 238772,
"component": "Common stock",
"opening_balance": 238772
},
{
"changes": [
"Changes in interests in subsidiaries",
"Share-based payment transactions",
"Other"
],
"closing_balance": 3376724,
"component": "Capital surplus",
"opening_balance": 3326093
},
{
"changes": [],
"closing_balance": 193199,
"component": "Other equity instruments",
"opening_balance": 193199
},
{
"changes": [
"Net income",
"Cash dividends",
"Distribution to owners of other equity instruments",
"Transfer of accumulated other comprehensive income to retained earnings",
"Purchase and disposal of treasury stock"
],
"closing_balance": 2701792,
"component": "Retained earnings",
"opening_balance": 1632966
},
{
"changes": [
"Purchase and disposal of treasury stock"
],
"closing_balance": -256251,
"component": "Treasury stock",
"opening_balance": -22725
},
{
"changes": [
"Other comprehensive income",
"Transfer of accumulated other comprehensive income to retained earnings"
],
"closing_balance": 5307305,
"component": "Accumulated other comprehensive income",
"opening_balance": 5793820
},
{
"changes": [
"Net income",
"Other comprehensive income",
"Cash dividends",
"Changes from loss of control",
"Changes in interests in subsidiaries",
"Issuance of other equity instruments in subsidiaries",
"Share-based payment transactions",
"Other"
],
"closing_balance": 2391485,
"component": "Non-controlling interests",
"opening_balance": 2075044
}
],
"period_end": "2025-03-31"
},
"statement_of_comprehensive_income": {
"currency": "JPY",
"periods": [
{
"items": [
{
"account_name": "Net income",
"amount": 1603108
},
{
"account_name": "Remeasurements of defined benefit plan",
"amount": 2598
},
{
"account_name": "Equity financial assets at FVTOCI",
"amount": -13757
},
{
"account_name": "Share of other comprehensive income of associates",
"amount": 162
},
{
"account_name": "Debt financial assets at FVTOCI",
"amount": -2373
},
{
"account_name": "Cash flow hedges",
"amount": 42263
},
{
"account_name": "Exchange differences on translating foreign operations",
"amount": -547774
},
{
"account_name": "Share of other comprehensive income of associates",
"amount": -1879
},
{
"account_name": "Total comprehensive income attributable to Owners of the parent",
"amount": 666237
},
{
"account_name": "Total comprehensive income attributable to Non-controlling interests",
"amount": 416111
}
],
"period_end": "2025-03-31",
"total_comprehensive_income": 1082348
}
]
},
"statement_of_financial_position": {
"currency": "JPY",
"periods": [
{
"as_of_date": "2024-03-31",
"items": [
{
"account_name": "Cash and cash equivalents",
"amount": 6186874,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Trade and other receivables",
"amount": 2868767,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Derivative financial assets",
"amount": 852350,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Other financial assets",
"amount": 777996,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Inventories",
"amount": 161863,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Other current assets",
"amount": 550984,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Assets classified as held for sale",
"amount": 42559,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Property, plant and equipment",
"amount": 1895289,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Right-of-use assets",
"amount": 746903,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Goodwill",
"amount": 5709874,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Intangible assets",
"amount": 2448840,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Costs to obtain contracts",
"amount": 317650,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investments accounted for using the equity method",
"amount": 839208,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investments from SVF (FVTPL)",
"amount": 11014487,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investment securities",
"amount": 9061972,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Derivative financial assets",
"amount": 385528,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Other financial assets",
"amount": 2424282,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Deferred tax assets",
"amount": 245954,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Other non-current assets",
"amount": 192863,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Interest-bearing debt",
"amount": 8271143,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Lease liabilities",
"amount": 149801,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Deposits for banking business",
"amount": 1643155,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Trade and other payables",
"amount": 2710529,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Derivative financial liabilities",
"amount": 195090,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Other financial liabilities",
"amount": 31801,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Income taxes payable",
"amount": 163226,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Provisions",
"amount": 44704,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Other current liabilities",
"amount": 801285,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Liabilities directly relating to assets classified as held for sale",
"amount": 9561,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Interest-bearing debt",
"amount": 12296381,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Lease liabilities",
"amount": 644706,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Third-party interests in SVF",
"amount": 4694503,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Derivative financial liabilities",
"amount": 41238,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Other financial liabilities",
"amount": 57017,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Provisions",
"amount": 167902,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Deferred tax liabilities",
"amount": 1253039,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Other non-current liabilities",
"amount": 311993,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Common stock",
"amount": 238772,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Capital surplus",
"amount": 3326093,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Other equity instruments",
"amount": 193199,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Retained earnings",
"amount": 1632966,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Treasury stock",
"amount": -22725,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Accumulated other comprehensive income",
"amount": 5793820,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Non-controlling interests",
"amount": 2075044,
"category": "Equity",
"subcategory": "Non-controlling interests"
}
]
},
{
"as_of_date": "2025-03-31",
"items": [
{
"account_name": "Cash and cash equivalents",
"amount": 3713028,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Trade and other receivables",
"amount": 3008144,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Derivative financial assets",
"amount": 111258,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Other financial assets",
"amount": 1485877,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Inventories",
"amount": 198291,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Other current assets",
"amount": 365880,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Assets classified as held for sale",
"amount": 550440,
"category": "Assets",
"subcategory": "Current assets"
},
{
"account_name": "Property, plant and equipment",
"amount": 2830185,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Right-of-use assets",
"amount": 857961,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Goodwill",
"amount": 5781931,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Intangible assets",
"amount": 2414562,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Costs to obtain contracts",
"amount": 383022,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investments accounted for using the equity method",
"amount": 502995,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investments from SVF (FVTPL)",
"amount": 11410922,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Investment securities",
"amount": 8040068,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Derivative financial assets",
"amount": 168248,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Other financial assets",
"amount": 2767625,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Deferred tax assets",
"amount": 207987,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Other non-current assets",
"amount": 215332,
"category": "Assets",
"subcategory": "Non-current assets"
},
{
"account_name": "Interest-bearing debt",
"amount": 5629648,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Lease liabilities",
"amount": 165355,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Deposits for banking business",
"amount": 1795965,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Trade and other payables",
"amount": 3036349,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Derivative financial liabilities",
"amount": 840469,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Other financial liabilities",
"amount": 5940,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Income taxes payable",
"amount": 444180,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Provisions",
"amount": 54047,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Other current liabilities",
"amount": 629717,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Liabilities directly relating to assets classified as held for sale",
"amount": 0,
"category": "Liabilities",
"subcategory": "Current liabilities"
},
{
"account_name": "Interest-bearing debt",
"amount": 12376682,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Lease liabilities",
"amount": 741665,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Third-party interests in SVF",
"amount": 3652797,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Derivative financial liabilities",
"amount": 104197,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Other financial liabilities",
"amount": 199284,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Provisions",
"amount": 155436,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Deferred tax liabilities",
"amount": 924392,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Other non-current liabilities",
"amount": 304607,
"category": "Liabilities",
"subcategory": "Non-current liabilities"
},
{
"account_name": "Common stock",
"amount": 238772,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Capital surplus",
"amount": 3376724,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Other equity instruments",
"amount": 193199,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Retained earnings",
"amount": 2701792,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Treasury stock",
"amount": -256251,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Accumulated other comprehensive income",
"amount": 5307305,
"category": "Equity",
"subcategory": "Equity attributable to owners of the parent"
},
{
"account_name": "Non-controlling interests",
"amount": 2391485,
"category": "Equity",
"subcategory": "Non-controlling interests"
}
]
}
]
},
"statement_of_profit_or_loss": {
"currency": "JPY",
"items": [
{
"account_name": "Net sales",
"amount": 7243752
},
{
"account_name": "Cost of sales",
"amount": -3489549
},
{
"account_name": "Gross profit",
"amount": 3754203
},
{
"account_name": "Gain (loss) on investments at Investment Business of Holding Companies",
"amount": 3413821
},
{
"account_name": "Gain (loss) on investments at SoftBank Vision Funds",
"amount": 387584
},
{
"account_name": "Gain (loss) on other investments",
"amount": -100298
},
{
"account_name": "Total gain on investments",
"amount": 3701107
},
{
"account_name": "Selling, general and administrative expenses",
"amount": -3024409
},
{
"account_name": "Finance cost",
"amount": -581559
},
{
"account_name": "Foreign exchange gain (loss)",
"amount": 27055
},
{
"account_name": "Derivative gain (loss) (excluding gain (loss) on investments)",
"amount": -2034029
},
{
"account_name": "Change in third-party interests in SVF",
"amount": -491898
},
{
"account_name": "Other gain",
"amount": 354251
},
{
"account_name": "Income before income tax",
"amount": 1704721
},
{
"account_name": "Income taxes",
"amount": -101613
},
{
"account_name": "Net income attributable to Owners of the parent",
"amount": 1153332
},
{
"account_name": "Net income attributable to Non-controlling interests",
"amount": 449776
},
{
"account_name": "Basic earnings per share (Yen)",
"amount": 780.82
},
{
"account_name": "Diluted earnings per share (Yen)",
"amount": 779.4
}
],
"net_income": 1603108,
"period_end": "2025-03-31",
"period_start": "2024-04-01"
}
}
Citations
Citations
Copy
Ask AI
{
"currency": [
{
"bboxes": [
{
"height": 809.6256103515625,
"left": 110.3904037475586,
"top": 153.60479736328125,
"width": 972.6048583984376
}
],
"citation_id": "H6umuS8",
"citation_type": "Segment",
"content": "<table>\n<tr>\n<td></td>\n<td colspan=\"2\">(Millions of yen)</td>\n</tr>\n<tr>\n<td></td>\n<td>As of March 31, 2024</td>\n<td>As of March 31, 2025</td>\n</tr>\n<tr>\n<td>Assets</td>\n<td></td>\n<td></td>\n</tr>\n<tr>\n<td>Current assets</td>\n<td></td>\n<td></td>\n</tr>\n<tr>\n<td>Cash and cash equivalents</td>\n<td>6,186,874</td>\n<td>3,713,028</td>\n</tr>\n<tr>\n<td>Trade and other receivables</td>\n<td>2,868,767</td>\n<td>3,008,144</td>\n</tr>\n<tr>\n<td>Derivative financial assets</td>\n<td>852,350</td>\n<td>111,258</td>\n</tr>\n<tr>\n<td>Other financial assets</td>\n<td>777,996</td>\n<td>1,485,877</td>\n</tr>\n<tr>\n<td>Inventories</td>\n<td>161,863</td>\n<td>198,291</td>\n</tr>\n<tr>\n<td>Other current assets</td>\n<td>550,984</td>\n<td>365,880</td>\n</tr>\n<tr>\n<td>Subtotal</td>\n<td>11,398,834</td>\n<td>8,882,478</td>\n</tr>\n<tr>\n<td>Assets classified as held for sale</td>\n<td>42,559</td>\n<td>550,440</td>\n</tr>\n<tr>\n<td>Total current assets</td>\n<td>11,441,393</td>\n<td>9,432,918</td>\n</tr>\n<tr>\n<td>Non-current assets</td>\n<td></td>\n<td></td>\n</tr>\n<tr>\n<td>Property, plant and equipment</td>\n<td>1,895,289</td>\n<td>2,830,185</td>\n</tr>\n<tr>\n<td>Right-of-use assets</td>\n<td>746,903</td>\n<td>857,961</td>\n</tr>\n<tr>\n<td>Goodwill</td>\n<td>5,709,874</td>\n<td>5,781,931</td>\n</tr>\n<tr>\n<td>Intangible assets</td>\n<td>2,448,840</td>\n<td>2,414,562</td>\n</tr>\n<tr>\n<td>Costs to obtain contracts</td>\n<td>317,650</td>\n<td>383,022</td>\n</tr>\n<tr>\n<td>Investments accounted for using the equity method</td>\n<td>839,208</td>\n<td>502,995</td>\n</tr>\n<tr>\n<td>Investments from SVF (FVTPL)</td>\n<td>11,014,487</td>\n<td>11,410,922</td>\n</tr>\n<tr>\n<td>Investment securities</td>\n<td>9,061,972</td>\n<td>8,040,068</td>\n</tr>\n<tr>\n<td>Derivative financial assets</td>\n<td>385,528</td>\n<td>168,248</td>\n</tr>\n<tr>\n<td>Other financial assets</td>\n<td>2,424,282</td>\n<td>2,767,625</td>\n</tr>\n<tr>\n<td>Deferred tax 
assets</td>\n<td>245,954</td>\n<td>207,987</td>\n</tr>\n<tr>\n<td>Other non-current assets</td>\n<td>192,863</td>\n<td>215,332</td>\n</tr>\n<tr>\n<td>Total non-current assets</td>\n<td>35,282,850</td>\n<td>35,580,838</td>\n</tr>\n<tr>\n<td>Total assets</td>\n<td>46,724,243</td>\n<td>45,013,756</td>\n</tr>\n</table>",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "wgSqyhR",
"segment_type": "Table"
},
{
"bboxes": [
{
"height": 20.534393310546875,
"left": 934.0416259765624,
"top": 2.8944091796875,
"width": 33.724853515625
}
],
"citation_id": "PfSpVmO",
"citation_type": "Word",
"content": "yen)",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": null,
"segment_type": "Text"
},
// .. more citations
],
"entity_name": [
{
"bboxes": [
{
"height": 36.99359893798828,
"left": 792.4896240234375,
"top": 48.959999084472656,
"width": 347.1983642578125
}
],
"citation_id": "z9EfpZH",
"citation_type": "Segment",
"content": "SoftBank Group Corp. Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "DWiMb98",
"segment_type": "PageHeader"
},
// .. more citations
],
"report_title": [
{
"bboxes": [
{
"height": 36.99359893798828,
"left": 792.4896240234375,
"top": 48.959999084472656,
"width": 347.1983642578125
}
],
"citation_id": "uc2mRtn",
"citation_type": "Segment",
"content": "SoftBank Group Corp. Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "DWiMb98",
"segment_type": "PageHeader"
},
// .. more citations
],
"reporting_as_of_date": [
{
"bboxes": [
{
"height": 36.99359893798828,
"left": 792.4896240234375,
"top": 48.959999084472656,
"width": 347.1983642578125
}
],
"citation_id": "rJos6_7",
"citation_type": "Segment",
"content": "SoftBank Group Corp. Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "DWiMb98",
"segment_type": "PageHeader"
},
// .. more citations
],
"reporting_period_end": [
{
"bboxes": [
{
"height": 36.99359893798828,
"left": 792.4896240234375,
"top": 48.959999084472656,
"width": 347.1983642578125
}
],
"citation_id": "vQLvY7M",
"citation_type": "Segment",
"content": "SoftBank Group Corp. Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "DWiMb98",
"segment_type": "PageHeader"
},
// .. more citations
],
"reporting_period_start": [
{
"bboxes": [
{
"height": 36.99359893798828,
"left": 792.4896240234375,
"top": 48.959999084472656,
"width": 347.1983642578125
}
],
"citation_id": "1luS4_E",
"citation_type": "Segment",
"content": "SoftBank Group Corp. Consolidated Financial Report For the Fiscal Year Ended March 31, 2025",
"page_height": 1683.99365234375,
"page_number": 1,
"page_width": 1190.0015869140625,
"segment_id": "DWiMb98",
"segment_type": "PageHeader"
},
// .. more citations
],
"statement_of_cash_flows": {
"currency": [
{
"bboxes": [
{
"height": 643.2047729492188,
"left": 112.10399627685548,
"top": 153.20159912109375,
"width": 949.4207763671876
}
],
"citation_id": "la9E9zd",
"citation_type": "Segment",
"content": "<table>\n<tr>\n<td></td>\n<td colspan=\"2\">(Millions of yen)</td>\n</tr>\n<tr>\n<td></td>\n<td>Fiscal year ended March 31, 2024</td>\n<td>Fiscal year ended March 31, 2025</td>\n</tr>\n<tr>\n<td>Cash flows from operating activities</td>\n<td></td>\n<td></td>\n</tr>\n<tr>\n<td>Net income</td>\n<td>209,217</td>\n<td>1,603,108</td>\n</tr>\n<tr>\n<td>Depreciation and amortization</td>\n<td>858,620</td>\n<td>866,823</td>\n</tr>\n<tr>\n<td>Loss (gain) on investments at Investment Business of Holding Companies</td>\n<td>449,817</td>\n<td>(3,422,188)</td>\n</tr>\n<tr>\n<td>Loss (gain) on investments at SoftBank Vision Funds</td>\n<td>167,290</td>\n<td>(387,584)</td>\n</tr>\n<tr>\n<td>Finance cost</td>\n<td>556,004</td>\n<td>581,559</td>\n</tr>\n<tr>\n<td>Foreign exchange loss (gain)</td>\n<td>703,122</td>\n<td>(27,055)</td>\n</tr>\n<tr>\n<td>Derivative (gain) loss (excluding (gain) loss on investments)</td>\n<td>(1,502,326)</td>\n<td>2,034,029</td>\n</tr>\n<tr>\n<td>Change in third-party interests in SVF</td>\n<td>390,137</td>\n<td>491,898</td>\n</tr>\n<tr>\n<td>(Gain) loss on other investments and other gain</td>\n<td>(271,064)</td>\n<td>(253,953)</td>\n</tr>\n<tr>\n<td>Income taxes</td>\n<td>(151,416)</td>\n<td>101,613</td>\n</tr>\n<tr>\n<td>Increase in investments from asset management subsidiaries</td>\n<td>(230,986)</td>\n<td>(769,572)</td>\n</tr>\n<tr>\n<td>Increase in trade and other receivables</td>\n<td>(476,511)</td>\n<td>(508,544)</td>\n</tr>\n<tr>\n<td>Decrease (increase) in inventories</td>\n<td>5,436</td>\n<td>(40,000)</td>\n</tr>\n<tr>\n<td>Increase in trade and other payables</td>\n<td>325,731</td>\n<td>237,030</td>\n</tr>\n<tr>\n<td>Other</td>\n<td>208,593</td>\n<td>93,974</td>\n</tr>\n<tr>\n<td>Subtotal</td>\n<td>1,241,664</td>\n<td>601,138</td>\n</tr>\n<tr>\n<td>Interest and dividends received</td>\n<td>256,083</td>\n<td>299,714</td>\n</tr>\n<tr>\n<td>Interest paid</td>\n<td>(430,422)</td>\n<td>(482,111)</td>\n</tr>\n<tr>\n<td>Income taxes 
paid</td>\n<td>(885,617)</td>\n<td>(380,008)</td>\n</tr>\n<tr>\n<td>Income taxes refunded</td>\n<td>68,839</td>\n<td>164,847</td>\n</tr>\n<tr>\n<td>Net cash provided by operating activities</td>\n<td>250,547</td>\n<td>203,580</td>\n</tr>\n</table>",
"page_height": 1683.99365234375,
"page_number": 9,
"page_width": 1190.0015869140625,
"segment_id": "r9RNukJ",
"segment_type": "Table"
},
// .. more citations
],
// .. more items
},
// .. more statements
}
Metrics
Metrics
Copy
Ask AI
{
"currency": {
"citation_status": "Created",
"confidence": "High"
},
"entity_name": {
"citation_status": "Created",
"confidence": "High"
},
"report_title": {
"citation_status": "Created",
"confidence": "High"
},
"reporting_as_of_date": {
"citation_status": "Created",
"confidence": "High"
},
"reporting_period_end": {
"citation_status": "Created",
"confidence": "High"
},
"reporting_period_start": {
"citation_status": "Created",
"confidence": "High"
},
"statement_of_cash_flows": {
"currency": {
"citation_status": "Created",
"confidence": "High"
},
"periods": [
{
"closing_cash_balance": {
"citation_status": "Created",
"confidence": "High"
},
"items": [
{
"account_name": {
"citation_status": "Created",
"confidence": "High"
}
}
// .. more items
]
}
// .. more periods
]
}
// .. more metrics
}
Medical Benefits Claim
Extract key data from medical benefits claim documents, such as employee, patient, diagnosis, procedure, and billing details.
Schema
Copy
Ask AI
import os
from datetime import date
from decimal import Decimal
from typing import List, Optional
from chunkr_ai import Chunkr
from pydantic import BaseModel
# Postal address broken into components; reused for the employee, patient,
# employer, facility, and physician addresses in this schema.
# NOTE(review): no defaults are given, so under Pydantic v2 these fields are
# presumably required-but-nullable — confirm this is intended.
class Address(BaseModel):
    line1: Optional[str]
    line2: Optional[str]
    city: Optional[str]
    state: Optional[str]
    country: Optional[str]
    postal_code: Optional[str]
    # Address as one unsplit string; in the sample output this is e.g.
    # "145 E Indian Blvd, Springfield, IL".
    raw: Optional[str]
# Details of the insured employee on the claim form.
class EmployeeInfo(BaseModel):
    employer_name: Optional[str]
    policy_group_number: Optional[str]
    aetna_id: Optional[str]
    full_name: Optional[str]
    birthdate: Optional[date]
    # Sample output value: "Active".
    employment_status: Optional[str]
    # null in the sample output, where the employee is "Active".
    date_of_retirement: Optional[date]
    address: Optional[Address]
    # Sample output holds digits only, e.g. "2155557890".
    phone: Optional[str]
# Details of the patient the claim is filed for (may differ from the employee).
class PatientInfo(BaseModel):
    full_name: Optional[str]
    aetna_id: Optional[str]
    birthdate: Optional[date]
    # Sample output value: "Child".
    relationship_to_employee: Optional[str]
    address: Optional[Address]
    # Sample output value: "Male".
    gender: Optional[str]
    # Sample output value: "Single".
    marital_status: Optional[str]
    employed: Optional[bool]
    # Both employer fields are null in the sample output, where employed is false.
    employer_name: Optional[str]
    employer_address: Optional[Address]
# Circumstances of the claim: accident / employment relation and any other
# insurance coverage.
class ClaimCircumstances(BaseModel):
    accident_related: Optional[bool]
    accident_date: Optional[date]
    # Kept as free text rather than a time type; sample output value: "3:30 pm".
    accident_time: Optional[str]
    employment_related: Optional[bool]
    other_coverage: Optional[bool]
    # The three other_* fields below are null in the sample output, where
    # other_coverage is false.
    other_insurance_company: Optional[str]
    other_policy_number: Optional[str]
    other_policy_holder: Optional[str]
# Signatures and signing dates from the authorization / assignment-of-benefits
# section of the form.
class Authorization(BaseModel):
    # Signatures are captured as transcribed text, e.g. "Anderson MJ" in the
    # sample output.
    patient_signature: Optional[str]
    patient_signature_date: Optional[date]
    assignment_of_benefits_signature: Optional[str]
    assignment_date: Optional[date]
# Treating facility and the admission/discharge dates of the stay.
class FacilityInfo(BaseModel):
    # Sample output value: "Springfield Community Hospital".
    name: Optional[str]
    address: Optional[Address]
    admission_date: Optional[date]
    discharge_date: Optional[date]
# Diagnoses stated on the claim, as text plus their codes.
class Diagnosis(BaseModel):
    # Sample output value: "Fractured Radius".
    primary: Optional[str]
    # Sample output value: ["Contusion of Forearm"].
    secondary: Optional[List[str]]
    # Sample output value: ["S52.5", "S50.1"].
    icd_codes: Optional[List[str]]
# One billed service line; MedicalBenefitsClaim.procedures holds a list of these.
class ProcedureEntry(BaseModel):
    service_date: Optional[date]
    # Sample output value: "Outpatient".
    place_of_service: Optional[str]
    # Stored as a string; sample output value: "73090".
    procedure_code: Optional[str]
    description: Optional[str]
    # Stored as a string even when numeric-looking; sample output value: "4".
    type_of_service: Optional[str]
    # Sample output emits this as a plain JSON number (e.g. 250).
    charge: Optional[Decimal]
    units: Optional[int]
    # Sample output value: "S52.5".
    diagnosis_code: Optional[str]
# Treating physician / provider details, including identifiers and signature.
class PhysicianInfo(BaseModel):
    full_name: Optional[str]
    address: Optional[Address]
    # Sample output holds digits only, e.g. "2171527785".
    phone: Optional[str]
    # Sample output value: "IL-12458".
    taxpayer_id: Optional[str]
    # Sample output value: "PT-20250215-001".
    patient_account_number: Optional[str]
    national_provider_identifier: Optional[str]
    # Signature captured as transcribed text; sample output value: "Jake B".
    signature: Optional[str]
    signature_date: Optional[date]
# Claim-level billing totals (sample output: total 1800, paid 200, due 1600).
class BillingSummary(BaseModel):
    total_charge: Optional[Decimal]
    amount_paid: Optional[Decimal]
    balance_due: Optional[Decimal]
# Root model for the medical benefits claim example; its JSON schema is what
# gets passed to the extract task.
# NOTE(review): every section is Optional with no default, so under Pydantic v2
# each key is presumably required-but-nullable in the schema — confirm.
class MedicalBenefitsClaim(BaseModel):
    employee: Optional[EmployeeInfo]
    patient: Optional[PatientInfo]
    claim_circumstances: Optional[ClaimCircumstances]
    authorization: Optional[Authorization]
    physician: Optional[PhysicianInfo]
    facility: Optional[FacilityInfo]
    diagnosis: Optional[Diagnosis]
    # One entry per billed service line.
    procedures: Optional[List[ProcedureEntry]]
    billing: Optional[BillingSummary]
Process
Copy
Ask AI
# Authenticate using the API key stored in the CHUNKR_API_KEY environment variable
client = Chunkr(api_key=os.environ["CHUNKR_API_KEY"])
# Derive the JSON schema from the root Pydantic model
schema = MedicalBenefitsClaim.model_json_schema()
# Submit the extract task for the sample claim form
task = client.tasks.extract.create(
    schema=schema,
    file="https://s3.us-east-1.amazonaws.com/chunkr-web/uploads/medical_benefits_claim.pdf",
)
Output
Copy
Ask AI
{
"authorization": {
"assignment_date": "2025-02-16",
"assignment_of_benefits_signature": "Anderson MJ",
"patient_signature": "Anderson MJ",
"patient_signature_date": "2025-02-16"
},
"billing": {
"amount_paid": 200,
"balance_due": 1600,
"total_charge": 1800
},
"claim_circumstances": {
"accident_date": "2025-02-12",
"accident_related": true,
"accident_time": "3:30 pm",
"employment_related": false,
"other_coverage": false,
"other_insurance_company": null,
"other_policy_holder": null,
"other_policy_number": null
},
"diagnosis": {
"icd_codes": [
"S52.5",
"S50.1"
],
"primary": "Fractured Radius",
"secondary": [
"Contusion of Forearm"
]
},
"employee": {
"address": {
"city": "Springfield",
"country": null,
"line1": "145 E Indian Blvd",
"line2": null,
"postal_code": null,
"raw": "145 E Indian Blvd, Springfield, IL",
"state": "IL"
},
"aetna_id": "E451958",
"birthdate": "1980-03-14",
"date_of_retirement": null,
"employer_name": "Technova Solutions Inc.",
"employment_status": "Active",
"full_name": "Anderson, Mary J.",
"phone": "2155557890",
"policy_group_number": "A124175"
},
"facility": {
"address": {
"city": "Springfield",
"country": null,
"line1": "451 Health Ave",
"line2": null,
"postal_code": "62704",
"raw": "Springfield Community Hospital, 451 Health Ave, Springfield, IL 62704",
"state": "IL"
},
"admission_date": "2025-02-15",
"discharge_date": "2025-02-16",
"name": "Springfield Community Hospital"
},
"patient": {
"address": {
"city": "Springfield",
"country": null,
"line1": "145 E Indian Blvd",
"line2": null,
"postal_code": null,
"raw": "145 E Indian Blvd, Springfield, IL",
"state": "IL"
},
"aetna_id": "P51309",
"birthdate": "2010-06-24",
"employed": false,
"employer_address": null,
"employer_name": null,
"full_name": "John R.",
"gender": "Male",
"marital_status": "Single",
"relationship_to_employee": "Child"
},
"physician": {
"address": {
"city": "Springfield",
"country": null,
"line1": "3 Health Ave",
"line2": "Springfield Orthopedics",
"postal_code": "62705",
"raw": "Springfield Orthopedics, 3 Health Ave, Springfield, IL 62705",
"state": "IL"
},
"full_name": "Dr. Jake Blakey",
"national_provider_identifier": "502357115",
"patient_account_number": "PT-20250215-001",
"phone": "2171527785",
"signature": "Jake B",
"signature_date": "2025-02-16",
"taxpayer_id": "IL-12458"
},
"procedures": [
{
"charge": 250,
"description": "X-ray Forearm",
"diagnosis_code": "S52.5",
"place_of_service": "Outpatient",
"procedure_code": "73090",
"service_date": "2025-02-15",
"type_of_service": "4",
"units": 1
},
{
"charge": 1200,
"description": "Closed Treatment, Radius",
"diagnosis_code": "S52.5",
"place_of_service": "Outpatient",
"procedure_code": "24500",
"service_date": "2025-02-15",
"type_of_service": "2",
"units": 1
},
{
"charge": 350,
"description": "Cast Application",
"diagnosis_code": "S52.5",
"place_of_service": "Outpatient",
"procedure_code": "29125",
"service_date": "2025-02-15",
"type_of_service": "1",
"units": 1
}
]
}
Citations
Citations
Copy
Ask AI
{
"authorization": {
"assignment_date": [
{
"bboxes": [
{
"height": 415.67041015625,
"left": 175.01759338378906,
"top": 1571.587158203125,
"width": 3364.04150390625
}
],
"citation_id": "jWTG4_G",
"citation_type": "Segment",
"content": "25. To all providers of health care: You are authorized to provide Aetna Life Insurance Company or one of its affiliated companies (\"Aetna\"), and any independent claim administrators and consulting health professionals and utilization review organizations with whom Aetna has contracted, information concerning health care advice, treatment or supplies provided the patient (including that relating to mental illness and/or AIDS/ARC/HIV). This information will be used to evaluate claims for benefits. Aetna may provide the employer named above with any benefit calculation used in payment of this claim for the purpose of reviewing the experience and operation of the policy or contract. This authorization is valid for the term of the policy or contract under which a claim has been submitted. I know that I have a right to receive a copy of this authorization upon request and agree that a photographic copy of this authorization is as valid as the original. Patient's or Authorized Person's Signature Anderson My Date 02/16/2025",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "BLnBeE4",
"segment_type": "Text"
},
// .. more citations
],
// .. more items
},
"billing": {
"amount_paid": [
{
"bboxes": [
{
"height": 191.908935546875,
"left": 2772.96484375,
"top": 3721.60791015625,
"width": 780.81103515625
}
],
"citation_id": "vvodDdV",
"citation_type": "Segment",
"content": "<table>\n <tr>\n <td>43. Total charge</td>\n <td>$</td>\n <td>1800</td>\n </tr>\n <tr>\n <td>Amount paid</td>\n <td>$</td>\n <td>200</td>\n </tr>\n <tr>\n <td>Balance due</td>\n <td>$</td>\n <td>1600</td>\n </tr>\n</table>",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "-GT9tT6",
"segment_type": "Table"
},
// .. more citations
],
// .. more items
},
"claim_circumstances": {
"accident_date": [
{
"bboxes": [
{
"height": 1227.672119140625,
"left": 165.268798828125,
"top": 351.15838623046875,
"width": 3391.847900390625
}
],
"citation_id": "MiC7PM2",
"citation_type": "Segment",
"content": "<table>\n <tbody>\n <tr>\n <td>1. Employer's Name<br><b>Technova Solutions Inc.</b></td>\n <td>2. Policy/Group Number<br><b>A124175</b></td>\n </tr>\n <tr>\n <td>3. Employee's Aetna ID Number<br><b>E451958</b></td>\n <td>4. Employee's Name<br><b>Anderson, Mary J.</b></td>\n <td>5. Employee's Birthdate (MM/DD/YYYY)<br><b>03/14/1980</b></td>\n </tr>\n <tr>\n <td>6. ☑ Active ☐ Retired<br>Date of Retirement</td>\n <td>7. Employee's Address (include ZIP Code)<br><b>145 E Indian Blvd, Springfield, IL</b></td>\n <td>☑ Address is new</td>\n <td>8. Employee's Daytime Telephone Number<br><b>( 215 ) 555-7890</b></td>\n </tr>\n <tr>\n <td>9. Patient's Name<br><b>John R.</b></td>\n <td>10. Patient's Aetna ID Number<br><b>P51309</b></td>\n <td>11. Patient's Birthdate (MM/DD/YYYY)<br><b>06/24/2010</b></td>\n <td>12. Patient's Relationship to Employee<br>☐ Self ☐ Spouse ☑ Child ☐ Other</td>\n </tr>\n <tr>\n <td colspan=\"3\">13. Patient's Address (if different from employee)</td>\n <td>14. Patient's Gender<br>☑ Male ☐ Female</td>\n </tr>\n <tr>\n <td>15. Patient's Marital Status<br>☐ Married ☑ Single</td>\n <td>16. Is patient employed?<br>☑ No ☐ Yes</td>\n <td colspan=\"2\">17. Name & Address of Employer</td>\n </tr>\n <tr>\n <td colspan=\"3\">18. Is claim related to an accident?<br>☐ No ☑ Yes If Yes, date <b>02/12/2025</b> time <b>3:30</b> ☐ am ☑ pm</td>\n <td>19. Is claim related to employment?<br>☑ No ☑ Yes</td>\n </tr>\n <tr>\n <td>20. Are any family members expenses covered by another group health plan, group pre-payment plan (Blue Cross- Blue Shield, etc.), no fault auto insurance, Medicare or any federal, state or local government plan?<br>☑ No ☐ Yes</td>\n <td colspan=\"3\">21. If Yes, list policy or contract holder, policy or contract number(s) and name/address of insurance company or administrator:</td>\n </tr>\n <tr>\n <td>22. Member's ID Number</td>\n <td>23. Member's Name</td>\n <td colspan=\"2\">24. 
Member's Birthdate (MM/DD/YYYY)</td>\n </tr>\n </tbody>\n</table>",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "qdlXRQf",
"segment_type": "Table"
},
{
"bboxes": [
{
"height": 47.9520263671875,
"left": 674.9423828125,
"top": 844.3008422851562,
"width": 245.9520263671875
}
],
"citation_id": "46uANRd",
"citation_type": "Word",
"content": "02/12/2025",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": null,
"segment_type": "Text"
}
],
// .. more items
"other_insurance_company": null,
"other_policy_holder": null,
"other_policy_number": null
},
"diagnosis": {
"icd_codes": [
{
"bboxes": [
{
"height": 53.0927734375,
"left": 180.36000061035156,
"top": 2770.257568359375,
"width": 677.7504272460938
}
],
"citation_id": "JsWdVrh",
"citation_type": "Segment",
"content": "1. Fractured Radius (ICD-10 S52.5)",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "Hol6zze",
"segment_type": "Text"
},
// .. more citations
],
// .. more items
},
"employee": {
"address": {
"city": [
{
"bboxes": [
{
"height": 1227.672119140625,
"left": 165.268798828125,
"top": 351.15838623046875,
"width": 3391.847900390625
}
],
"citation_id": "W3_iKpQ",
"citation_type": "Segment",
"content": "<table>\n <tbody>\n <tr>\n <td>1. Employer's Name<br><b>Technova Solutions Inc.</b></td>\n <td>2. Policy/Group Number<br><b>A124175</b></td>\n </tr>\n <tr>\n <td>3. Employee's Aetna ID Number<br><b>E451958</b></td>\n <td>4. Employee's Name<br><b>Anderson, Mary J.</b></td>\n <td>5. Employee's Birthdate (MM/DD/YYYY)<br><b>03/14/1980</b></td>\n </tr>\n <tr>\n <td>6. ☑ Active ☐ Retired<br>Date of Retirement</td>\n <td>7. Employee's Address (include ZIP Code)<br><b>145 E Indian Blvd, Springfield, IL</b></td>\n <td>☑ Address is new</td>\n <td>8. Employee's Daytime Telephone Number<br><b>( 215 ) 555-7890</b></td>\n </tr>\n <tr>\n <td>9. Patient's Name<br><b>John R.</b></td>\n <td>10. Patient's Aetna ID Number<br><b>P51309</b></td>\n <td>11. Patient's Birthdate (MM/DD/YYYY)<br><b>06/24/2010</b></td>\n <td>12. Patient's Relationship to Employee<br>☐ Self ☐ Spouse ☑ Child ☐ Other</td>\n </tr>\n <tr>\n <td colspan=\"3\">13. Patient's Address (if different from employee)</td>\n <td>14. Patient's Gender<br>☑ Male ☐ Female</td>\n </tr>\n <tr>\n <td>15. Patient's Marital Status<br>☐ Married ☑ Single</td>\n <td>16. Is patient employed?<br>☑ No ☐ Yes</td>\n <td colspan=\"2\">17. Name & Address of Employer</td>\n </tr>\n <tr>\n <td colspan=\"3\">18. Is claim related to an accident?<br>☐ No ☑ Yes If Yes, date <b>02/12/2025</b> time <b>3:30</b> ☐ am ☑ pm</td>\n <td>19. Is claim related to employment?<br>☑ No ☑ Yes</td>\n </tr>\n <tr>\n <td>20. Are any family members expenses covered by another group health plan, group pre-payment plan (Blue Cross- Blue Shield, etc.), no fault auto insurance, Medicare or any federal, state or local government plan?<br>☑ No ☐ Yes</td>\n <td colspan=\"3\">21. If Yes, list policy or contract holder, policy or contract number(s) and name/address of insurance company or administrator:</td>\n </tr>\n <tr>\n <td>22. Member's ID Number</td>\n <td>23. Member's Name</td>\n <td colspan=\"2\">24. 
Member's Birthdate (MM/DD/YYYY)</td>\n </tr>\n </tbody>\n</table>",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "qdlXRQf",
"segment_type": "Table"
},
// .. more citations
],
// .. more items
},
// .. more items
},
"facility": {
"address": {
"city": [
{
"bboxes": [
{
"height": 63.54736328125,
"left": 182.9664001464844,
"top": 2644.847900390625,
"width": 1697.3568115234375
}
],
"citation_id": "VbxB14m",
"citation_type": "Segment",
"content": "Springfield Community Hospital, 451 Health Ave, Springfield, IL 62704",
"page_height": 5262.0048828125,
"page_number": 1,
"page_width": 3719.9951171875,
"segment_id": "OkZta-w",
"segment_type": "Text"
},
// .. more citations
],
// .. more items
},
// .. more items
},
// .. more items
}
Metrics
Metrics
Copy
Ask AI
{
"authorization": {
"assignment_date": {
"citation_status": "Created",
"confidence": "High"
},
"assignment_of_benefits_signature": {
"citation_status": "Created",
"confidence": "High"
},
"patient_signature": {
"citation_status": "Created",
"confidence": "High"
},
"patient_signature_date": {
"citation_status": "Created",
"confidence": "High"
}
},
"billing": {
"amount_paid": {
"citation_status": "Created",
"confidence": "High"
},
"balance_due": {
"citation_status": "Created",
"confidence": "High"
},
"total_charge": {
"citation_status": "Created",
"confidence": "High"
}
},
"claim_circumstances": {
"accident_date": {
"citation_status": "Created",
"confidence": "High"
},
"accident_related": {
"citation_status": "Created",
"confidence": "High"
},
"accident_time": {
"citation_status": "Created",
"confidence": "High"
},
"employment_related": {
"citation_status": "Created",
"confidence": "High"
},
"other_coverage": {
"citation_status": "Created",
"confidence": "High"
},
"other_insurance_company": {
"citation_status": "Skipped",
"confidence": "High"
},
"other_policy_holder": {
"citation_status": "Skipped",
"confidence": "High"
},
"other_policy_number": {
"citation_status": "Skipped",
"confidence": "High"
}
},
"diagnosis": {
"icd_codes": {
"citation_status": "Created",
"confidence": "High"
},
"primary": {
"citation_status": "Created",
"confidence": "High"
},
"secondary": {
"citation_status": "Created",
"confidence": "High"
}
},
"employee": {
"address": {
"city": {
"citation_status": "Created",
"confidence": "High"
},
// .. more items
},
"aetna_id": {
"citation_status": "Created",
"confidence": "High"
},
"birthdate": {
"citation_status": "Created",
"confidence": "High"
},
"date_of_retirement": {
"citation_status": "Skipped",
"confidence": "High"
},
"employer_name": {
"citation_status": "Created",
"confidence": "High"
},
"employment_status": {
"citation_status": "Created",
"confidence": "High"
},
"full_name": {
"citation_status": "Created",
"confidence": "High"
},
"phone": {
"citation_status": "Created",
"confidence": "High"
},
"policy_group_number": {
"citation_status": "Created",
"confidence": "High"
}
},
"facility": {
"address": {
"city": {
"citation_status": "Created",
"confidence": "High"
},
// .. more items
},
"admission_date": {
"citation_status": "Created",
"confidence": "High"
},
"discharge_date": {
"citation_status": "Created",
"confidence": "High"
},
"name": {
"citation_status": "Created",
"confidence": "High"
}
},
"patient": {
"address": {
"city": {
"citation_status": "Created",
"confidence": "High"
},
// .. more items
},
"aetna_id": {
"citation_status": "Created",
"confidence": "High"
},
// .. more items
},
"physician": {
"address": {
"city": {
"citation_status": "Created",
"confidence": "High"
},
// .. more items
},
"full_name": {
"citation_status": "Created",
"confidence": "High"
},
"national_provider_identifier": {
"citation_status": "Created",
"confidence": "High"
},
"patient_account_number": {
"citation_status": "Created",
"confidence": "High"
},
"phone": {
"citation_status": "Created",
"confidence": "High"
},
"signature": {
"citation_status": "Created",
"confidence": "Low"
},
"signature_date": {
"citation_status": "Created",
"confidence": "High"
},
"taxpayer_id": {
"citation_status": "Created",
"confidence": "High"
}
},
"procedures": [
{
"charge": {
"citation_status": "Created",
"confidence": "High"
},
"description": {
"citation_status": "Created",
"confidence": "High"
},
"diagnosis_code": {
"citation_status": "Created",
"confidence": "High"
},
"place_of_service": {
"citation_status": "Created",
"confidence": "High"
},
"procedure_code": {
"citation_status": "Created",
"confidence": "High"
},
"service_date": {
"citation_status": "Created",
"confidence": "Low"
},
"type_of_service": {
"citation_status": "Created",
"confidence": "High"
},
"units": {
"citation_status": "Created",
"confidence": "High"
}
}
// .. more procedures
]
}
Best Practices
Schema Design Tips
- Use Descriptive Field Names: Choose clear, unambiguous field names that reflect the actual data being extracted.
- Handle Optional Fields Appropriately: Mark fields as optional when they may not be present in all documents.
- Include Field Descriptions: Use Pydantic’s `Field(description="...")` or Zod’s `.describe()` to provide context.
- Use Appropriate Data Types: Choose the right types (string, number, boolean, array, date) for each field.
Extraction Optimization
- Custom System Prompts: Tailor prompts to your document type. See the system prompt parameter for details.
- Quality Validation: Use citation trails alongside confidence scores to validate extractions.
Confidence values are currently experimental. Treat them as a heuristic for
ranking rather than a definitive measure of correctness. We
recommend using them conservatively and pairing scores with citation
reviews.