diff --git a/.github/workflows/pypi-publish.yml b/.github/workflows/pypi-publish.yml
index 2fed051..5cfa82b 100644
--- a/.github/workflows/pypi-publish.yml
+++ b/.github/workflows/pypi-publish.yml
@@ -12,13 +12,13 @@ jobs:
     runs-on: ubuntu-latest
 
     steps:
-    - uses: actions/checkout@v4
+    - uses: actions/checkout@v6
     - name: Set up Python
-      uses: actions/setup-python@v5
+      uses: actions/setup-python@v6
       with:
-        python-version: '3.11'
+        python-version: '3.12'
     - name: Install uv
-      uses: astral-sh/setup-uv@v5
+      uses: astral-sh/setup-uv@v8.1.0
     - name: Build
       run: uv build
     - name: Publish
diff --git a/.github/workflows/run-pytest.yml b/.github/workflows/run-pytest.yml
index 8b294f0..68547c4 100644
--- a/.github/workflows/run-pytest.yml
+++ b/.github/workflows/run-pytest.yml
@@ -18,15 +18,15 @@ jobs:
         python-version: ['3.11', '3.12', '3.13']
 
     steps:
-    - uses: actions/checkout@v4
+    - uses: actions/checkout@v6
     - name: Set up Python ${{ matrix.python-version }}
-      uses: actions/setup-python@v5
+      uses: actions/setup-python@v6
       with:
         python-version: ${{ matrix.python-version }}
     - name: Install uv
-      uses: astral-sh/setup-uv@v5
+      uses: astral-sh/setup-uv@v8.1.0
     - name: Install dependencies
-      run: uv sync --all-extras --dev
+      run: uv sync --dev
     - name: Extract test files
       run: ./.github/scripts/extract_files.sh
       env:
@@ -44,8 +44,10 @@ jobs:
         KFINTECH_CAS_FILE_NEW: ${{ secrets.KFINTECH_CAS_FILE_NEW }}
         KFINTECH_CAS_PASSWORD: ${{ secrets.KFINTECH_CAS_PASSWORD }}
         NSDL_CAS_FILE_1: ${{ secrets.NSDL_CAS_FILE_1 }}
+        CDSL_CAS_FILE_1: ${{ secrets.CDSL_CAS_FILE_1 }}
+        CDSL_CAS_PASSWORD: ${{ secrets.CDSL_CAS_PASSWORD }}
     - name: Upload coverage report to codecov
-      uses: codecov/codecov-action@v5
+      uses: codecov/codecov-action@v6
       with:
         files: ./coverage.xml
         token: ${{ secrets.CODECOV_TOKEN }}
diff --git a/.gitignore b/.gitignore
index 19b9779..359c00a 100644
--- a/.gitignore
+++ b/.gitignore
@@ -133,6 +133,7 @@ dmypy.json
 tests/files/**
 tests/files.tar
 tests/files.tar.bz2
+tests/samples/**
 .DS_Store
 
 casparser.code-workspace
diff --git a/CHANGELOG.md b/CHANGELOG.md
index c3a39c0..8fa82ed 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,7 +1,71 @@
 # Changelog
 
+## 1.0.0
+
+Major release. The parsing backend was rewritten from scratch on
+[pypdfium2](https://github.com/pypdfium2-team/pypdfium2) (Apache-2.0 /
+BSD-3) and the four supported CAS issuers now each have a dedicated
+parser tuned to their template family.
+
+### Breaking changes
+
+- **pdfminer.six and PyMuPDF backends removed.** `casparser.read_cas_pdf`
+  no longer dispatches between them. The `mupdf` / `fast` extras in
+  `pyproject.toml` are gone. The `--force-pdfminer` CLI flag and the
+  `force_pdfminer=` kwarg on `read_cas_pdf` are kept as no-ops; the
+  kwarg emits a `DeprecationWarning` and is otherwise ignored.
+- **License simplified to pure MIT.** With the GPL/AGPL-licensed
+  PyMuPDF dependency gone, the `licenses/` directory of GPL/AGPL
+  copies has been removed. pypdfium2 is dual Apache-2.0 / BSD-3 and
+  doesn't impose any copyleft obligation on users of casparser.
+- **Minimum Python is now 3.11.** 3.9 / 3.10 classifiers dropped from
+  `pyproject.toml`.
+- **`CASData.investor_info` is now `Optional[InvestorInfo]`** (matches
+  the `NSDLCASData.investor_info` shape that already existed). It is
+  populated on every supported issuer, but consumers should still
+  guard against the `None` case for unfamiliar templates.
+- **Internal `casparser.process` package removed.** The two helpers
+  downstream code still imports from it are now at
+  `casparser.parsers._classify` (`get_parsed_scheme_name`,
+  `get_transaction_type`) and `casparser.parsers._isin` (`isin_search`).
+
+### New
+
+- **First-class NSDL and CDSL parsers.** Drops the regex-on-text
+  approach the pre-1.0 NSDL/CDSL code used; the new parsers consume
+  structured `Block`/`Cell` records directly from `pypdfium2`. Several
+  bugs the pre-1.0 NSDL/CDSL code shipped with no longer occur
+  (misplaced-UCC-as-folio on NSDL MF Holdings, space-merged
+  folio+units cells on CDSL, the silently-dropped NSDL HDFC
+  subaccount on CDSL multi-account statements, `Optional[Decimal]`
+  comma-strip miss in the `MutualFund` validator).
+- **CAMS / KFin 2026 templates supported** out of the box. The newer
+  CAMS SUMMARY template added an ISIN column the v0.8 regex didn't
+  match; v1.0 parses all rows. The newer KFin SUMMARY template emits
+  zero-balance schemes with single-space-separated trio cells that
+  the v0.8 regex required `\t\t` between; v1.0 picks them up too.
+- **AMC-header detection extended** to include the `Fund House`
+  suffix. v0.8's regex only matched `Mutual Fund` / `MF` suffixes,
+  so schemes from a few newer AMCs whose names end in `Fund House`
+  ended up bucketed under the previous AMC.
+- **ISIN / AMFI enrichment has a direct-ISIN fallback** path via
+  `MFISINDb.direct_isin_lookup` for the case where multi-line
+  `Registrar:` rendering corrupts the RTA token.
+
+### Fixed
+
+- **CAMS SUMMARY `valuation.date` no longer mis-parses to year 201**
+  (was a column-boundary bug — the NAVDate column, treated as
+  right-aligned with a 42pt width, clipped the trailing year digit,
+  then Pydantic mis-coerced the `01-Jan-201` string).
+- **CDSL multi-account statements** (5+ demat accounts on one PDF) are
+  now parsed correctly. Earlier the page-3+ scan only kicked in from
+  page 8, dropping holdings sections that landed on pages 4-7.
+- **CDSL MF holdings** rows with `DIRECT` (or any non-`ARN-XXXX`
+  distribution-mode token) now correctly populate `pnl` and `return_`.
+
 ## 0.9.0 - 2026-05-22
-- Add support for CDSL sttements
+- Add support for CDSL statements
 - Drop support for Python 3.9 and 3.10; minimum supported version is now 3.11
 - Support PyMuPDF >= 1.25 (1.27.x tested). Older `<1.25` pin removed.
 - Bump `casparser-isin` to `>= 2026.5.1` (new DB format v2 with
@@ -11,20 +75,9 @@
   field (Python attribute `return_`) also gets the comma-stripping
   treatment; previously NSDL MF folio rows with a return value of
   1 lakh or more would fail Decimal validation.
-- Parser robustness fixes for PyMuPDF 1.25+ text extraction quirks:
-  - Re-emit visual rows as separate blocks for CAMS/KFINTECH so the
-    table header / folio header no longer get merged when the new
-    block grouping collapses them into a single PyMuPDF block.
-  - Recover the registrar value (e.g. `KFINTECH`) when it wraps to the
-    next line.
-  - Recover the advisor value when the scheme name wraps before the
-    advisor closing paren.
-  - Pull ISIN/Advisor onto the scheme line when long scheme names wrap.
-  - Tax transactions (`*** Stamp Duty ***`, STT, TDS) no longer absorb
-    spurious units when an adjacent column wraps onto the same row.
-  - NSDL holdings: widen the y-band tolerance, drop the strict
-    multiline `$` anchoring, and accept tab-separated wrapped names so
-    the regexes match consistently across Python 3.11–3.14.
+- Parser robustness fixes for PyMuPDF 1.25+ text extraction quirks
+  (all superseded in 1.0.0 by the pypdfium2 rewrite, kept here for
+  the historical record).
 
 ## 0.8.1 - 2025-09-21
 - NSDL parser bug fixes
diff --git a/README.md b/README.md
index 7843491..8c53e41 100644
--- a/README.md
+++ b/README.md
@@ -6,7 +6,8 @@
 [![codecov](https://codecov.io/gh/codereverser/casparser/branch/main/graph/badge.svg?token=DYZ7TXWRGI)](https://codecov.io/gh/codereverser/casparser)
 ![PyPI - Python Version](https://img.shields.io/pypi/pyversions/casparser)
 
-Parse Consolidated Account Statement (CAS) PDF files generated from CAMS/KFINTECH
+Parse Consolidated Account Statement (CAS) PDF files generated from
+CAMS, KFintech, NSDL, and CDSL.
 
 `casparser` also includes a command line tool with the following analysis tools
 - `summary`- print portfolio summary
@@ -19,13 +20,8 @@ Parse Consolidated Account Statement (CAS) PDF files generated from CAMS/KFINTEC
 pip install -U casparser
 ```
 
-### with faster PyMuPDF parser
-```bash
-pip install -U 'casparser[fast]'
-```
-
-**Note:** Enabling this dependency could result in licensing changes. Check the
-[License](#license) section for more details
+Since v1.0 the parser is built on [pypdfium2](https://github.com/pypdfium2-team/pypdfium2)
+(Apache-2.0 / BSD-3) — no optional PDF backends, no GPL/AGPL dependencies.
 
 
 ## Usage
@@ -50,7 +46,7 @@ csv_str = casparser.read_cas_pdf("/path/to/cas/file.pdf", "password", output="cs
         "from": "YYYY-MMM-DD",
         "to": "YYYY-MMM-DD"
     },
-    "file_type": "CAMS/KARVY/UNKNOWN",
+    "file_type": "CAMS/KFINTECH/NSDL/CDSL/UNKNOWN",
     "cas_type": "DETAILED/SUMMARY",
     "investor_info": {
         "email": "string",
@@ -122,6 +118,9 @@ Notes:
   - `MISC`
 - `dividend_rate` is applicable only for `DIVIDEND_PAYOUT` and
   `DIVIDEND_REINVESTMENT` transactions.
+- NSDL and CDSL statements return a different top-level shape with
+  `accounts[].equities[]` and `accounts[].mutual_funds[]` instead of
+  `folios[].schemes[]`. See `casparser.types.NSDLCASData` for details.
 
 ### CLI
 
@@ -143,8 +142,6 @@ Usage: casparser [-o output_file.json|output_file.csv] [-p password] [-s] [-a] C
   --gains-112a ask|FY2020-21      Generate Capital Gains Report - 112A format for
                                   a given financial year - Use 'ask' for a prompt
                                   from available options (BETA)
-  --force-pdfminer                Force PDFMiner parser even if MuPDF is
-                                  detected
 
   --version                       Show the version and exit.
   -h, --help                      Show this message and exit.
@@ -199,11 +196,16 @@ failing scheme name(s).
 
 ## License
 
-CASParser is distributed under MIT license by default. However enabling the optional dependency
-`mupdf/fast` would imply the use of [PyMuPDF](https://github.com/pymupdf/PyMuPDF) /
-[MuPDF](https://mupdf.com/license.html) and hence the licenses GNU GPL v3 and GNU Affero GPL v3
-would apply. Copies of all licenses have been included in this repository. - _IANAL_
+CASParser is distributed under the MIT license. Up to v0.9 the optional
+`mupdf` / `fast` extra pulled in [PyMuPDF](https://github.com/pymupdf/PyMuPDF) /
+[MuPDF](https://mupdf.com/license.html), which would have caused GNU GPL v3
+and GNU Affero GPL v3 to apply transitively. v1.0 dropped that extra
+(the PyMuPDF and pdfminer.six backends are gone; the parser now runs on
+[pypdfium2](https://github.com/pypdfium2-team/pypdfium2), which is dual
+Apache-2.0 / BSD-3), so casparser is now pure MIT end-to-end.
 
 ## Resources
 1. [CAS from CAMS](https://www.camsonline.com/Investors/Statements/Consolidated-Account-Statement)
 2. [CAS from Karvy/Kfintech](https://mfs.kfintech.com/investor/General/ConsolidatedAccountStatement)
+3. [NSDL Consolidated Account Statement](https://nsdlcas.nsdl.com/)
+4. [CDSL Consolidated Account Statement](https://www.cdslindia.com/Investors/Cas.html)
diff --git a/casparser/__init__.py b/casparser/__init__.py
index 3684a46..a7615e5 100644
--- a/casparser/__init__.py
+++ b/casparser/__init__.py
@@ -9,4 +9,4 @@
     "CapitalGainsReport",
 ]
 
-__version__ = "0.9.0"
+__version__ = "1.0.0"
diff --git a/casparser/cli.py b/casparser/cli.py
index 9762422..63cce9f 100644
--- a/casparser/cli.py
+++ b/casparser/cli.py
@@ -37,7 +37,7 @@ def formatINR(number):
     else:
         last3 = int_part[-3:]
         rest = int_part[:-3]
-        groups = [rest[max(0, i - 2):i or None] for i in range(len(rest), 0, -2)][::-1]
+        groups = [rest[max(0, i - 2) : i or None] for i in range(len(rest), 0, -2)][::-1]
         if groups and groups[0]:
             r = ",".join(groups + [last3])
         else:
@@ -82,7 +82,7 @@ def print_nsdl(parsed_data: NSDLCASData):
     )
     summary_table.add_row(Padding("File Type :", spacing), f"[bold]{data['file_type']}[/]")
     # summary_table.add_row(Padding("CAS Type :", spacing), f"[bold]{data['cas_type']}[/]")
-    for key, value in data["investor_info"].items():
+    for key, value in (data.get("investor_info") or {}).items():
         summary_table.add_row(
             Padding(f"{key.capitalize()} :", spacing), re.sub(r"[^\S\r\n]+", " ", value)
         )
@@ -208,7 +208,7 @@ def print_summary(parsed_data: CASData, output_filename=None, include_zero_folio
     summary_table.add_row(Padding("File Type :", spacing), f"[bold]{data['file_type']}[/]")
     summary_table.add_row(Padding("CAS Type :", spacing), f"[bold]{data['cas_type']}[/]")
 
-    for key, value in data["investor_info"].items():
+    for key, value in (data.get("investor_info") or {}).items():
         summary_table.add_row(
             Padding(f"{key.capitalize()} :", spacing), re.sub(r"[^\S\r\n]+", " ", value)
         )
diff --git a/casparser/parsers/__init__.py b/casparser/parsers/__init__.py
index efdbf3e..a56ad4c 100644
--- a/casparser/parsers/__init__.py
+++ b/casparser/parsers/__init__.py
@@ -1,72 +1,156 @@
+"""Top-level dispatcher for `casparser.read_cas_pdf`.
+
+v1.0 reorganisation: pdfminer.six and PyMuPDF are gone. Everything
+runs on pypdfium2 with parsers that consume structured page-object
+data directly (no text-rendering / regex round-trip for NSDL+CDSL,
+column-aware layout reading for CAMS+KFin).
+
+The four issuer-specific parsers live alongside this file:
+
+  cams_detailed.py  → CAMS / KFin DETAILED statements
+  cams_summary.py   → CAMS / KFin SUMMARY statements
+  nsdl.py           → NSDL Consolidated Account Statement
+  cdsl.py           → CDSL Consolidated Account Statement
+
+`read_cas_pdf` sniffs the issuer + statement variant from the PDF's
+first page, dispatches to the right parser, optionally sorts
+transactions chronologically, and returns either `CASData` (CAMS/KFin)
+or `NSDLCASData` (NSDL/CDSL).
+"""
+
+from __future__ import annotations
+
 import io
+import warnings
 from typing import Union
 
-from casparser.process import process_cas_text
-from casparser.types import CASData, NSDLCASData, ProcessedCASData
+from casparser.enums import CASFileType, FileType
+from casparser.exceptions import CASParseError
+from casparser.types import CASData, NSDLCASData
 
+from .detect import _open_document, detect_cas_type, detect_file_type
 from .utils import cas2csv, cas2json
 
 
+def _sort_transactions(data: CASData) -> CASData:
+    """Date-sort each out-of-order scheme's transactions and rebuild the running
+    balance from `scheme.open`. Mutates `data` in place and returns it."""
+    for folio in data.folios:
+        for idx, scheme in enumerate(folio.schemes):
+            dates = [x.date for x in scheme.transactions]
+            if dates == sorted(dates):
+                continue  # already chronological — stored balances are left as-is
+            sorted_txns = []
+            balance = scheme.open
+            for txn in sorted(scheme.transactions, key=lambda x: x.date):
+                balance += txn.units or 0  # falsy units (None / 0) leave the balance unchanged
+                txn.balance = balance
+                sorted_txns.append(txn)
+            scheme.transactions = sorted_txns
+            folio.schemes[idx] = scheme
+    return data
+
+
 def read_cas_pdf(
     filename: Union[str, io.IOBase],
-    password,
-    output="dict",
-    sort_transactions=True,
-    force_pdfminer=False,
+    password: str,
+    output: str = "dict",
+    sort_transactions: bool = True,
+    force_pdfminer: bool = False,
 ):
-    """
-    Parse CAS pdf and returns line data.
+    """Parse a Consolidated Account Statement PDF.
 
-    :param filename: CAS pdf file (CAMS or Kfintech)
-    :param password: CAS pdf password
-    :param output: Output format (json,dict)  [default: dict]
-    :param sort_transactions: Sort transactions by date and re-compute balances.
-    :param force_pdfminer: Force pdfminer parser even if mupdf is detected
+    :param filename: path to the CAS PDF (or an open file-like object).
+    :param password: PDF password (most CAS PDFs are encrypted with the
+                     investor's PAN).
+    :param output: `"dict"` (default) returns the typed model directly,
+                   `"json"` returns its JSON serialisation, `"csv"`
+                   returns a CSV string of transactions or holdings.
+    :param sort_transactions: For CAMS / KFin DETAILED statements, sort
+                              each scheme's transactions by date and
+                              re-compute the running balance. Default
+                              `True`.
+    :param force_pdfminer: **Deprecated.** v1.0 dropped pdfminer in
+                          favour of pypdfium2. Setting this to True
+                          emits a `DeprecationWarning` and is otherwise
+                          ignored.
+    :return: `CASData` for CAMS/KFin issuers, `NSDLCASData` for
+             NSDL/CDSL issuers, or a serialised form of either when
+             `output` is `"json"` / `"csv"`.
     """
     if force_pdfminer:
-        from .pdfminer import cas_pdf_to_text
-    else:
-        try:
-            from .mupdf import cas_pdf_to_text
-        except (ImportError, ModuleNotFoundError):
-            from .pdfminer import cas_pdf_to_text
-
-    partial_cas_data = cas_pdf_to_text(filename, password)
-    processed_data = process_cas_text(
-        "\u2029".join(partial_cas_data.lines), partial_cas_data.file_type
-    )
-    if isinstance(processed_data, ProcessedCASData):
-        if sort_transactions:
-            for folio in processed_data.folios:
-                for idx, scheme in enumerate(folio.schemes):
-                    dates = [x.date for x in scheme.transactions]
-                    sorted_dates = list(sorted(dates))
-                    if dates != sorted_dates:
-                        sorted_transactions = []
-                        balance = scheme.open
-                        for transaction in sorted(scheme.transactions, key=lambda x: x.date):
-                            balance += transaction.units or 0
-                            transaction.balance = balance
-                            sorted_transactions.append(transaction)
-                        scheme.transactions = sorted_transactions
-                    folio.schemes[idx] = scheme
-
-        final_data = CASData(
-            statement_period=processed_data.statement_period,
-            folios=processed_data.folios,
-            investor_info=partial_cas_data.investor_info,
-            cas_type=processed_data.cas_type,
-            file_type=partial_cas_data.file_type,
+        warnings.warn(
+            "force_pdfminer is deprecated in casparser 1.0 — pdfminer "
+            "is no longer a supported backend.",
+            DeprecationWarning,
+            stacklevel=2,
         )
-    else:
-        final_data = NSDLCASData(
-            statement_period=processed_data.statement_period,
-            accounts=processed_data.accounts,
-            investor_info=partial_cas_data.investor_info,
-            file_type=partial_cas_data.file_type,
+
+    # Open the PDF exactly once and thread it through the detect /
+    # parser / investor extractor calls — every pypdfium2 open re-runs
+    # the password decrypt + content-stream parse, so the savings on
+    # multi-page detailed statements are significant.
+    doc = _open_document(filename, password)
+
+    file_type = detect_file_type(filename, password, _doc=doc)
+    if file_type == FileType.UNKNOWN:
+        raise CASParseError(
+            "Could not identify the CAS issuer. Supported issuers are "
+            "CAMS, KFintech, NSDL, and CDSL."
         )
+
+    if file_type in (FileType.CAMS, FileType.KFINTECH):
+        cas_type = detect_cas_type(filename, password, _doc=doc)
+        if cas_type == CASFileType.DETAILED:
+            from . import cams_detailed
+
+            data: Union[CASData, NSDLCASData] = cams_detailed.parse(
+                filename,
+                password,
+                file_type=file_type,
+                _doc=doc,
+            )
+        elif cas_type == CASFileType.SUMMARY:
+            from . import cams_summary
+
+            data = cams_summary.parse(
+                filename,
+                password,
+                file_type=file_type,
+                _doc=doc,
+            )
+        else:
+            raise CASParseError(
+                "Could not identify whether this is a DETAILED or " "SUMMARY CAMS / KFin statement."
+            )
+        if sort_transactions and isinstance(data, CASData):
+            data = _sort_transactions(data)
+    elif file_type == FileType.NSDL:
+        from . import nsdl
+
+        data = nsdl.parse_nsdl(
+            filename,
+            password,
+            file_type=FileType.NSDL,
+            _doc=doc,
+        )
+    elif file_type == FileType.CDSL:
+        from . import cdsl
+
+        data = cdsl.parse_cdsl(
+            filename,
+            password,
+            file_type=FileType.CDSL,
+            _doc=doc,
+        )
+    else:  # pragma: no cover — handled above
+        raise CASParseError(f"Unsupported file type: {file_type}")
+
     if output == "dict":
-        return final_data
-    elif output == "csv":
-        return cas2csv(final_data)
-    return cas2json(final_data)
+        return data
+    if output == "csv":
+        return cas2csv(data)
+    return cas2json(data)
+
+
+__all__ = ["read_cas_pdf"]
diff --git a/casparser/parsers/_classify.py b/casparser/parsers/_classify.py
new file mode 100644
index 0000000..972e11c
--- /dev/null
+++ b/casparser/parsers/_classify.py
@@ -0,0 +1,114 @@
+"""Classification helpers shared across the CAMS / KFin parsers.
+
+Two pure utilities:
+
+- `get_transaction_type` maps a transaction description + signed units
+  count to a `TransactionType` enum, also extracting the dividend rate
+  for IDCW / dividend lines.
+- `get_parsed_scheme_name` normalises a raw scheme name (drops
+  `(formerly ...)`, `(erstwhile ...)`, `(Demat ...)` trailers, collapses
+  whitespace).
+
+These are pulled out of the old `casparser.process.cas_detailed` module
+because the pypdfium2 DETAILED parser still needs them but the rest of
+that module's text-rendering machinery is now gone.
+"""
+
+from __future__ import annotations
+
+import re
+from decimal import Decimal
+from typing import Optional, Tuple
+
+from casparser.enums import TransactionType
+
+# Matches an IDCW / dividend transaction description. Captures the
+# "reinvest" hint (if present) and the per-unit rupee value.
+DIVIDEND_RE = re.compile(
+    r"(?:div\.|dividend|idcw).+?(reinvest)*.*?@\s*Rs\.\s*([\d\.]+)(?:\s+per\s+unit)?",
+    re.I | re.DOTALL,
+)
+
+
+def get_transaction_type(
+    description: str, units: Optional[Decimal]
+) -> Tuple[TransactionType, Optional[Decimal]]:
+    """Classify a transaction by its description + units sign.
+
+    Returns `(transaction_type, dividend_rate_or_None)`. A `DIVIDEND_RE` match
+    is checked first, whatever `units` is; only then is the rate non-None.
+    """
+    dividend_rate: Optional[Decimal] = None
+    description = description.lower()  # keyword checks below are written in lowercase
+    if div_match := DIVIDEND_RE.search(description):
+        # NOTE(review): the lazy `.+?` seems to let group 1 capture only when "reinvest"
+        reinvest_flag, dividend_str = div_match.groups()  # starts 1 char after the keyword — confirm
+        dividend_rate = Decimal(dividend_str)
+        txn_type = (
+            TransactionType.DIVIDEND_REINVEST if reinvest_flag else TransactionType.DIVIDEND_PAYOUT
+        )
+    elif units is None:  # no units value: STT / stamp duty / TDS rows, otherwise MISC
+        if "stt" in description:
+            txn_type = TransactionType.STT_TAX
+        elif "stamp" in description:
+            txn_type = TransactionType.STAMP_DUTY_TAX
+        elif "tds" in description:
+            txn_type = TransactionType.TDS_TAX
+        else:
+            txn_type = TransactionType.MISC
+    elif units > 0:
+        if "switch" in description:
+            txn_type = (
+                TransactionType.SWITCH_IN_MERGER
+                if "merger" in description
+                else TransactionType.SWITCH_IN
+            )
+        elif "segregat" in description:
+            txn_type = TransactionType.SEGREGATION
+        elif (
+            "sip" in description
+            or "systematic" in description
+            or re.search(r"instal+ment", description, re.I)
+            or re.search(r"sys.+?invest", description, re.I | re.DOTALL)
+        ):
+            txn_type = TransactionType.PURCHASE_SIP
+        else:
+            txn_type = TransactionType.PURCHASE
+    elif units < 0:
+        if re.search(
+            r"reversal|rejection|dishonoured|mismatch|insufficient\s+balance",
+            description,
+            re.I,
+        ):
+            txn_type = TransactionType.REVERSAL
+        elif "switch" in description:
+            txn_type = (
+                TransactionType.SWITCH_OUT_MERGER
+                if "merger" in description
+                else TransactionType.SWITCH_OUT
+            )
+        else:
+            txn_type = TransactionType.REDEMPTION
+    else:  # units compared equal to zero and the description is not a dividend line
+        txn_type = TransactionType.UNKNOWN
+
+    return txn_type, dividend_rate
+
+
+def get_parsed_scheme_name(scheme: str) -> str:
+    """Remove `(formerly ...)` / `(erstwhile ...)` parentheticals, cut everything
+    from `(Demat` / `(Non-Demat` onwards, collapse whitespace, and strip trailing
+    characters other than ASCII letters, digits, `_` and `)`."""
+    scheme = re.sub(
+        r"\((formerly|erstwhile).+?\)",
+        "",
+        scheme,
+        flags=re.I | re.DOTALL,
+    ).strip()
+    scheme = re.sub(
+        r"\((Demat|Non-Demat).*",
+        "",
+        scheme,
+        flags=re.I | re.DOTALL,
+    ).strip()
+    scheme = re.sub(r"\s+", " ", scheme).strip()
+    return re.sub(r"[^a-zA-Z0-9_)]+$", "", scheme).strip()
diff --git a/casparser/parsers/_investor.py b/casparser/parsers/_investor.py
new file mode 100644
index 0000000..e8ec246
--- /dev/null
+++ b/casparser/parsers/_investor.py
@@ -0,0 +1,192 @@
+"""Investor-info extractors for the four supported CAS issuers.
+
+Both extractors filter the source PDF's atoms to a top-left column on
+a known page (page 1 for CAMS/KFin, page 2 for NSDL/CDSL), then walk
+top-down picking out labelled fields. We use page-object atoms rather
+than baseline-clustered lines so the right-column disclaimer text
+that shares y-baselines with the investor block doesn't contaminate
+the result.
+
+The CAMS/KFin block carries the full quartet (name, email, address,
+mobile). The NSDL/CDSL block carries only the name and address —
+those CAS variants don't print the investor's email or mobile on the
+statement, so those fields come back as empty strings.
+"""
+
+from __future__ import annotations
+
+import re
+from typing import TYPE_CHECKING, List, Optional
+
+from casparser.exceptions import CASParseError
+from casparser.types import InvestorInfo
+
+from .pageobj import Atom, extract_atoms
+
+if TYPE_CHECKING:  # pragma: no cover
+    import pypdfium2 as pdfium
+
+
+# Top-left column cutoffs. Everything to the right is the disclaimer
+# paragraph (CAMS/KFin) or the cover-page banner (NSDL/CDSL). 200 is
+# the conservative right edge that fits all observed templates.
+_LEFT_COLUMN_X = 200.0
+
+
+_EMAIL_RE = re.compile(r"Email\s*Id\s*:\s*(\S+@\S+)", re.I)
+_MOBILE_RE = re.compile(r"Mobile\s*:\s*([+\d]+)", re.I)
+_PHONE_RE = re.compile(r"^\s*Phone\s+Off\s*:", re.I)
+_PINCODE_RE = re.compile(r"^\s*(?:Pin\s*code|PINCODE)\s*:\s*\d+", re.I)
+_ID_MARKER_RE = re.compile(r"^\s*(?:CAS|NSDL)\s*ID\s*:", re.I)
+
+
+def _left_column_atoms(atoms: List[Atom]) -> List[Atom]:
+    """Keep non-blank atoms with `x_left < _LEFT_COLUMN_X`, sorted top-down."""
+    filtered = [a for a in atoms if a.x_left < _LEFT_COLUMN_X and a.text.strip()]
+    filtered.sort(key=lambda a: -a.y_top)  # descending y_top
+    return filtered
+
+
+def extract_cams_kfin_investor(
+    pdf_path,
+    password,
+    *,
+    _doc: "Optional[pdfium.PdfDocument]" = None,
+    _atoms: Optional[List[List[Atom]]] = None,
+) -> InvestorInfo:
+    """Read the investor block from the top-left of page 1.
+
+    Layout across CAMS and KFin templates:
+
+      Email Id: <email>
+      <Investor Name>
+      <Address line 1>
+      ...
+      <Address line N>
+      [Phone Off: ...]                  ← only on some KFin templates
+      Mobile: <mobile>
+
+    We anchor on `Email Id:` (always present on CAMS/KFin), then
+    everything until `Mobile:` (exclusive) is name + address. The
+    name is the first non-label line; the rest is address. Stray
+    `Phone Off:` lines are dropped from the address.
+
+    Every CAS statement carries this block by mandate. If we can't
+    find it we raise `CASParseError` — a CAS without identifiable
+    investor is malformed, not a "missing field" case.
+
+    `_doc` / `_atoms`: dispatcher-provided overrides to avoid a
+    second pypdfium2 open + page-object walk when the caller has
+    already extracted atoms for the holdings parser.
+    """
+    pages = (
+        _atoms
+        if _atoms is not None
+        else extract_atoms(
+            pdf_path,
+            password,
+            _doc=_doc,
+        )
+    )
+    block = _left_column_atoms(pages[0]) if pages else []  # first page only
+
+    email = ""
+    mobile = ""
+    name = ""
+    address_lines: List[str] = []
+    seen_email = False
+
+    for atom in block:
+        text = atom.text.strip()
+        if m := _EMAIL_RE.match(text):
+            email = m.group(1).strip()
+            seen_email = True
+            continue
+        if m := _MOBILE_RE.match(text):  # tested before the seen_email guard below
+            mobile = m.group(1).strip()
+            # Mobile is the last field of the investor block — stop here
+            # so the transaction table that follows isn't picked up.
+            break
+        if not seen_email:
+            continue  # nothing is collected before the `Email Id:` line
+        if _PHONE_RE.match(text):
+            continue
+        if not name:
+            name = text
+        else:
+            address_lines.append(text)
+
+    if not name:  # also reached for an empty page list or a missing `Email Id:` line
+        raise CASParseError(
+            "Could not extract investor info from CAMS/KFin CAS PDF. "
+            "Expected an `Email Id:` line followed by name + address + "
+            "`Mobile:` in the top-left column of page 1."
+        )
+    return InvestorInfo(
+        name=name,
+        email=email,
+        address="\n".join(address_lines),
+        mobile=mobile,
+    )
+
+
+def extract_nsdl_cdsl_investor(
+    pdf_path,
+    password,
+    *,
+    _doc: "Optional[pdfium.PdfDocument]" = None,
+    _atoms: Optional[List[List[Atom]]] = None,
+) -> InvestorInfo:
+    """NSDL / CDSL print the investor block on page 2 (after the cover
+    page). The block is delimited by a `CAS ID:` (CDSL) or `NSDL ID:`
+    (NSDL) marker on top and a `PINCODE:` line on the bottom. Name is the
+    first line after the marker; the rest, PINCODE line included, is address.
+    Email and mobile aren't printed in these CAS variants, so they
+    come back as empty strings.
+
+    Raises `CASParseError` if no investor block is found — a CAS
+    without identifiable investor is malformed.
+
+    `_doc` / `_atoms`: dispatcher-provided overrides; see
+    `extract_cams_kfin_investor`.
+    """
+    pages = (
+        _atoms
+        if _atoms is not None
+        else extract_atoms(
+            pdf_path,
+            password,
+            _doc=_doc,
+        )
+    )
+    block = _left_column_atoms(pages[1]) if len(pages) >= 2 else []  # second page only
+
+    name = ""
+    address_lines: List[str] = []
+    seen_marker = False
+    for atom in block:
+        text = atom.text.strip()
+        if _ID_MARKER_RE.match(text):
+            seen_marker = True
+            continue
+        if not seen_marker:
+            continue  # nothing is collected before the ID marker line
+        if not name:
+            name = text
+            continue
+        address_lines.append(text)
+        if _PINCODE_RE.match(text):
+            break  # the PINCODE line was appended above, so it ends the address
+
+    if not name:  # also reached when the document has fewer than two pages
+        raise CASParseError(
+            "Could not extract investor info from NSDL/CDSL CAS PDF. "
+            "Expected a `CAS ID:` / `NSDL ID:` marker followed by name + "
+            "address in the top-left column of page 2."
+        )
+    return InvestorInfo(
+        name=name,
+        email="",
+        address="\n".join(address_lines),
+        mobile="",
+    )
diff --git a/casparser/parsers/_isin.py b/casparser/parsers/_isin.py
new file mode 100644
index 0000000..edcc6db
--- /dev/null
+++ b/casparser/parsers/_isin.py
@@ -0,0 +1,40 @@
+from typing import Optional, Tuple
+
+from casparser_isin import MFISINDb
+
+
+def isin_search(
+    scheme_name: str,
+    rta: str,
+    rta_code: str,
+    isin: Optional[str] = None,
+) -> Tuple[Optional[str], Optional[str], Optional[str]]:
+    """Resolve a CAS scheme to its `(ISIN, AMFI code, type)` triple.
+
+    Two lookups are attempted against `MFISINDb`, in order:
+
+    1. `isin_lookup(scheme_name, rta, rta_code, isin=isin)`. A
+       `ValueError` from this call is treated as "no match".
+    2. Only when step 1 missed and the caller supplied an `isin` (e.g.,
+       parsed inline from the scheme header): `direct_isin_lookup(isin)`,
+       using the first returned row. This bypasses RTA mis-detection that
+       can happen when the `Registrar:` value gets mangled by multi-line
+       rendering on pypdfium2's char extraction.
+
+    :param scheme_name: Normalised scheme name from the CAS.
+    :param rta: Registrar (`CAMS` / `KFINTECH` / `FTAMIL` …).
+    :param rta_code: Scheme's per-RTA code.
+    :param isin: Optional ISIN hint pulled from the scheme header.
+    :return: `(isin, amfi_code, type)`, or `(None, None, None)` when
+        neither lookup produced a result.
+    """
+    not_found = (None, None, None)
+    with MFISINDb() as db:
+        try:
+            match = db.isin_lookup(scheme_name, rta, rta_code, isin=isin)
+            return match.isin, match.amfi_code, match.type
+        except ValueError:
+            # Primary lookup missed; fall through to the ISIN hint.
+            pass
+        if not isin:
+            return not_found
+        try:
+            candidates = db.direct_isin_lookup(isin)
+            if candidates:
+                first = candidates[0]
+                return first["isin"], first["amfi_code"], first["type"]
+        except (ValueError, KeyError, TypeError):
+            # Best-effort fallback: any lookup/row-shape problem means
+            # "not found" rather than a failed parse.
+            pass
+        return not_found
diff --git a/casparser/parsers/cams_detailed.py b/casparser/parsers/cams_detailed.py
new file mode 100644
index 0000000..b79d487
--- /dev/null
+++ b/casparser/parsers/cams_detailed.py
@@ -0,0 +1,546 @@
+"""POC: CAMS DETAILED CAS parser using column-based row reading.
+
+`parse` returns a `CASData` whose folios follow the same `Folio` / `Scheme`
+shape as the production parser so output can be diffed directly. ISIN/AMFI
+enrichment (`isin_search`) and investor info (`extract_cams_kfin_investor`)
+run as separate passes — they are orthogonal to the column-reader question.
+
+Scope of this POC (handles):
+- One CAS, possibly multi-page
+- One AMC, one folio header per folio, one scheme header per scheme
+- Transaction table with 6 standard columns (Date / Transaction / Amount /
+  Units / Price / Unit Balance)
+- "Opening Unit Balance", "Closing Unit Balance", "NAV on", "Valuation on"
+  labeled rows
+- ISIN / AMFI lookup
+- Nominees
+- Total Cost Value parsing
+- Investor info / statement period
+
+Deferred:
+- Multi-line transaction descriptions (we keep first line only)
+- Segregated portfolios
+"""
+
+from __future__ import annotations
+
+import re
+from dataclasses import dataclass
+from decimal import Decimal, InvalidOperation
+from typing import List, Optional
+
+from dateutil import parser as dateparse
+
+from casparser.enums import CASFileType, FileType
+from casparser.types import (
+    CASData,
+    Folio,
+    Scheme,
+    SchemeValuation,
+    StatementPeriod,
+    TransactionData,
+)
+
+from ._classify import get_parsed_scheme_name, get_transaction_type
+from ._investor import extract_cams_kfin_investor
+from ._isin import isin_search
+from .extract import Char, Line, extract_pages
+
+# -----------------------------------------------------------------------------
+# Column anchors
+# -----------------------------------------------------------------------------
+
+# CAMS DETAILED transaction table. The header is two physical rows in the
+# PDF: "Date Transaction Amount Units Price Unit" on top, "(INR) (INR)
+# Balance" below. `detect_txn_columns` requires at least TXN_MIN_HITS
+# distinct labels from this set within one header window (a run of lines
+# spanning up to HEADER_WINDOW_Y pts), not necessarily on a single line.
+TXN_HEADER_LABELS = {"Date", "Transaction", "Amount", "Units", "Price", "Unit", "Balance", "NAV"}
+TXN_MIN_HITS = 4
+
+# Alignment per canonical column label, used by `_build_columns`.
+# All numeric columns are right-aligned; Date and Transaction are left-aligned.
+# "Unit" and "Balance" have no entries of their own: the two header words are
+# merged into the single "Unit Balance" column.
+ALIGN = {
+    "Date": "left",
+    "Transaction": "left",
+    "Amount": "right",
+    "Units": "right",
+    "Price": "right",
+    "Unit Balance": "right",
+    "NAV": "right",
+}
+
+
+@dataclass
+class Column:
+    """One table column, located by the x-extent of its header label."""
+
+    label: str
+    # Horizontal range covered by the header label text.
+    x_lo: float
+    x_hi: float
+    # Either 'left' or 'right'.
+    alignment: str
+
+    @property
+    def x_anchor(self) -> float:
+        """Snap target for cell values: `x_hi` when the column is
+        right-aligned, `x_lo` otherwise."""
+        if self.alignment == "right":
+            return self.x_hi
+        return self.x_lo
+
+
+def _words_on_line(line: Line, min_gap: float = 1.5) -> List[tuple[str, float, float]]:
+    """Group a line's chars into words and return `[(text, x0, x1)]`.
+
+    Chars are visited in ascending `x0` order; a new word starts whenever
+    the horizontal gap between the previous char's `x1` and the next
+    char's `x0` exceeds `min_gap`.
+    """
+    words = []
+    buf = ""
+    start = end = None
+    for ch in sorted(line.chars, key=lambda c: c.x0):
+        # Close the running word when this char sits too far to the right.
+        if buf and ch.x0 - end > min_gap:
+            words.append((buf, start, end))
+            buf = ""
+        if not buf:
+            start = ch.x0
+        buf = buf + ch.text
+        end = ch.x1
+    if buf:
+        words.append((buf, start, end))
+    return words
+
+
+# Vertical span (pts) that constitutes one logical header block. CAMS uses
+# 2 baselines spanning ~10pt; KFin uses 4 baselines spanning ~11pt
+# (Amount/Price at top, Unit, Date/Transaction/Units, (INR)/(INR)/Balance
+# at bottom).
+HEADER_WINDOW_Y = 15.0
+
+
+def detect_txn_columns(lines: List[Line], start_idx: int) -> Optional[tuple[int, List[Column]]]:
+    """Locate the first transaction-table header at or after `start_idx`.
+
+    For every candidate top line, a window is grown downwards over the
+    following lines for as long as their baseline stays within
+    HEADER_WINDOW_Y points of the top line's baseline. The window is a
+    header when the words on all of its lines together contain at least
+    TXN_MIN_HITS distinct entries of TXN_HEADER_LABELS. Pooling the whole
+    window means stacked labels ("Unit" over "Balance", or KFin's
+    4-baseline split) are handled like a single-row header.
+
+    Returns `(index_of_last_line_in_header, ordered columns)`, or `None`
+    when no window qualifies. Transaction parsing should start at
+    index + 1.
+    """
+    total = len(lines)
+    for top in range(start_idx, total):
+        top_y = lines[top].baseline
+        # `end` is one past the last line that still belongs to the window.
+        end = top + 1
+        while end < total and not (top_y - lines[end].baseline > HEADER_WINDOW_Y):
+            end += 1
+
+        header_words: List[tuple[str, float, float]] = [
+            word for ln in lines[top:end] for word in _words_on_line(ln)
+        ]
+        hits = {text for text, _, _ in header_words if text in TXN_HEADER_LABELS}
+        if len(hits) >= TXN_MIN_HITS:
+            return end - 1, _build_columns(header_words)
+    return None
+
+
+def _build_columns(words: List[tuple[str, float, float]]) -> List[Column]:
+    """Turn header words into `Column`s, sorted left to right by `x_lo`.
+
+    - "Unit" is merged with the first "Balance" word whose x-midpoint lies
+      within 30 pts of its own; the merged "Unit Balance" column spans both
+      words and is right-aligned. A "Unit" without such a partner yields
+      no column.
+    - Every other word that is a key of `ALIGN` becomes a column with
+      that alignment and the word's own x-extent.
+    - Words that are neither (e.g. "(INR)") are ignored.
+
+    :param words: `(text, x0, x1)` tuples collected from the header window.
+    """
+    # Computed once up front instead of re-scanning `words` per header word.
+    has_balance = any(w_text == "Balance" for w_text, _, _ in words)
+    cols: List[Column] = []
+    for text, x0, x1 in words:
+        if text == "Unit" and has_balance:
+            unit_mid = (x0 + x1) / 2
+            # Find "Balance" with overlapping x-range
+            for w_text, w_x0, w_x1 in words:
+                if w_text == "Balance" and abs((w_x0 + w_x1) / 2 - unit_mid) < 30:
+                    cols.append(Column("Unit Balance", min(x0, w_x0), max(x1, w_x1), "right"))
+                    break
+        elif text in ALIGN and text not in ("Unit", "Balance"):
+            cols.append(Column(text, x0, x1, ALIGN[text]))
+    cols.sort(key=lambda c: c.x_lo)
+    return cols
+
+
+# Width (pts) of the zone assigned to a right-aligned numeric column:
+# values sit within this width to the left of the column's x_hi. Wide
+# enough for any common Indian-format amount (e.g. "1,23,45,678.90") but
+# narrow enough to exclude wrapped description text that bleeds in from
+# the left.
+NUMERIC_ZONE_WIDTH = 55.0
+
+
+def _column_ranges(columns: List[Column]) -> List[tuple[Column, float, float]]:
+    """Return `(column, lo, hi)` x-zones, ordered by header midpoint.
+
+    Right-aligned (numeric) columns get a fixed-width zone that ends just
+    past the header's right edge: `[x_hi - NUMERIC_ZONE_WIDTH, x_hi + 3)`.
+    Left-aligned columns start 3 pts before their header and run up to the
+    start of the following column's zone, or to infinity for the last one.
+
+    Why the asymmetry: description text (Transaction column) is wide and
+    naturally extends into the Amount column's x-space, whereas the amount
+    itself occupies a narrow strip right-aligned to x_hi. Numeric zones
+    are therefore bounded by content width, not by midpoints to neighbors.
+    """
+    ordered = sorted(columns, key=lambda c: (c.x_lo + c.x_hi) / 2)
+    last = len(ordered) - 1
+    spans: List[tuple[Column, float, float]] = []
+    for pos, col in enumerate(ordered):
+        if col.alignment == "right":
+            spans.append((col, col.x_hi - NUMERIC_ZONE_WIDTH, col.x_hi + 3.0))
+            continue
+        if pos == last:
+            upper = float("inf")
+        else:
+            follower = ordered[pos + 1]
+            if follower.alignment == "right":
+                upper = follower.x_hi - NUMERIC_ZONE_WIDTH
+            else:
+                upper = follower.x_lo - 3.0
+        spans.append((col, col.x_lo - 3.0, upper))
+    return spans
+
+
+def assign_cells(line: Line, columns: List[Column]) -> dict[str, str]:
+    """Split one line into per-column cell text.
+
+    Each char goes to the first zone (from `_column_ranges`) that contains
+    its x-midpoint; chars outside every zone are dropped. Within a cell,
+    chars are rendered left to right and a single space is inserted
+    wherever the gap between neighbours exceeds `max(1.5, 0.6 * median
+    char height)`. Columns that received no chars are absent from the
+    result. Overlay duplicates are already filtered upstream by
+    ``extract.extract_pages`` at the atom level.
+    """
+    zones = _column_ranges(columns)
+    buckets = {col.label: [] for col in columns}
+    for ch in line.chars:
+        centre = (ch.x0 + ch.x1) / 2
+        owner = next((col for col, lo, hi in zones if lo <= centre < hi), None)
+        if owner is not None:
+            buckets[owner.label].append(ch)
+
+    rendered = {}
+    for label, members in buckets.items():
+        if not members:
+            continue
+        ordered = sorted(members, key=lambda c: c.x0)
+        heights = sorted(c.h for c in ordered)
+        threshold = max(1.5, 0.6 * heights[len(heights) // 2])
+        pieces = [ordered[0].text]
+        for prev, ch in zip(ordered, ordered[1:]):
+            if ch.x0 - prev.x1 > threshold:
+                pieces.append(" ")
+            pieces.append(ch.text)
+        rendered[label] = "".join(pieces).strip()
+    return rendered
+
+
+# -----------------------------------------------------------------------------
+# Label parsers (folio/scheme/labeled rows)
+# -----------------------------------------------------------------------------
+
+# Folio header line. Groups: 1 = folio number, 2 = PAN, 3 = KYC status,
+# 4 = PAN status (stored as `PANKYC` by `parse`).
+FOLIO_LINE_RE = re.compile(
+    # Folio format: <digits> with optional " / <digits>" sub-account
+    # suffix. Spaces around the slash are common in the source PDF.
+    # Each of PAN / KYC / PAN-KYC is optional but when present
+    # appears in this order on the same line. `.*?` lives *inside*
+    # the optional group so a non-greedy match doesn't skip past it
+    # and leave the capture empty.
+    r"Folio\s+No\s*:\s*(\d+(?:\s*/\s*\d+)?)"
+    r"(?:.*?PAN\s*:\s*([A-Z]{5}\d{4}[A-Z]))?"
+    r"(?:.*?KYC\s*:\s*(OK|NOT OK))?"
+    r"(?:.*?PAN\s*:\s*(OK|NOT OK))?",
+    re.I,
+)
+SCHEME_HEAD_RE = re.compile(
+    # `<CODE>-<NAME> Registrar:<RTA>`. The `<NAME>` chunk may carry
+    # inline `(Advisor: <ARN>)` and `- ISIN: <ISIN>` segments in either
+    # order — newer KFin templates put `(Advisor:...) - ISIN:...`,
+    # newer CAMS templates put `- ISIN: ...(Advisor: ...)`. We capture
+    # everything between code and Registrar as `name` and then strip
+    # the advisor / ISIN fragments out in a second pass.
+    r"^(?P<code>[\w\s]+?)-\s*(?P<name>.+?)" r"\s+Registrar\s*:\s*(?P<rta>\S+)",
+    re.I,
+)
+# Inline fragments stripped out of the scheme name; group 1 is the value.
+INLINE_ISIN_RE = re.compile(r"[-\s]*ISIN\s*:\s*([A-Z0-9]+)", re.I)
+INLINE_ADVISOR_RE = re.compile(r"[-\s]*\(\s*Advisor\s*:\s*([^)]+?)\)", re.I)
+# Registrar value on its own; not referenced by `parse` in this module.
+SCHEME_HEAD_RTA_RE = re.compile(r"Registrar\s*:\s*(\S+)", re.I)
+# Labeled rows under a scheme. Numeric captures may contain thousands
+# separators and are converted with `_decimal`.
+OPEN_BAL_RE = re.compile(r"Opening\s+Unit\s+Balance\s*:?\s*([\d,.]+)", re.I)
+CLOSE_BAL_RE = re.compile(r"Closing\s+Unit\s+Balance\s*:?\s*([\d,.]+)", re.I)
+# Group 1 = date (DD-Mon-YYYY), group 2 = value in INR.
+NAV_RE = re.compile(r"NAV\s+on\s+(\d{2}-[A-Za-z]{3}-\d{4})\s*:\s*INR\s*([\d,.]+)", re.I)
+VALUATION_RE = re.compile(
+    r"(?:Valuation|Market\s+Value)\s+on\s+(\d{2}-[A-Za-z]{3}-\d{4})\s*:\s*INR\s*([\d,.]+)",
+    re.I,
+)
+COST_VALUE_RE = re.compile(r"Total\s+Cost\s+Value\s*:?\s*([\d,.]+)", re.I)
+# Nominee block on the folio header. Three optional name slots; an
+# empty slot ("Nominee 2: ") means no nominee at that position.
+NOMINEE_RE = re.compile(
+    r"Nominee\s+1\s*:\s*(?P<n1>[^:]*?)\s*(?:Nominee\s+2\s*:\s*(?P<n2>[^:]*?)\s*"
+    r"(?:Nominee\s+3\s*:\s*(?P<n3>.*?))?)?$",
+    re.I,
+)
+# Statement period "DD-Mon-YYYY To DD-Mon-YYYY"; groups are (from, to).
+STMT_PERIOD_RE = re.compile(
+    r"(\d{2}-[A-Za-z]{3}-\d{4})\s+To\s+(\d{2}-[A-Za-z]{3}-\d{4})",
+    re.I,
+)
+# AMC header line. Most issuers end in "Mutual Fund" or "MF"; a few
+# newer entrants use "<X> Fund House" instead. We anchor on the
+# trailing suffix so disclaimer paragraphs that happen to mention an
+# AMC name mid-sentence don't get classified as section headers.
+AMC_RE = re.compile(
+    r"^(.+?\s+(?:MF|Mutual\s*Fund|Fund\s*House))$",
+    re.I,
+)
+# Extract leading date pattern. Accept "25-Oct-2021", "25 Oct 2021",
+# "25Oct2021", etc. Dashes sometimes sit on a different baseline. The
+# regex anchors only at start so it survives stray trailing chars
+# (e.g. KFin's instalment number "1" leaking from the description column).
+DATE_CELL_RE = re.compile(r"^\s*(\d{1,2}[-\s]*[A-Za-z]{3}[-\s]*\d{4})")
+
+
+def _decimal(s: Optional[str]) -> Optional[Decimal]:
+    """Parse a numeric cell into a `Decimal`, or return `None`.
+
+    Thousands separators (",") are removed. A leading "(" or "-" marks
+    the value as negative, so both "(1,234.50)" and "-1,234.50" give
+    `Decimal("-1234.50")`.
+
+    Returns `None` for `None`, blank input, text that is not a number,
+    and non-finite values ("NaN", "Infinity"). The last case keeps stray
+    text from turning running unit balances into NaN or making later
+    `quantize` calls raise.
+    """
+    if s is None:
+        return None
+    s = s.strip()
+    if not s:
+        return None
+    neg = s.startswith("(") or s.startswith("-")
+    s = s.lstrip("(").rstrip(")").lstrip("-").replace(",", "")
+    try:
+        d = Decimal(s)
+    except (InvalidOperation, ValueError):
+        # Not a number — treat like an empty cell.
+        return None
+    if not d.is_finite():
+        return None
+    return -d if neg else d
+
+
+# -----------------------------------------------------------------------------
+# Top-level parse
+# -----------------------------------------------------------------------------
+
+
+def parse(
+    pdf_path: str,
+    password: str,
+    file_type: FileType = FileType.UNKNOWN,
+    *,
+    _doc=None,
+) -> CASData:
+    """Parse a DETAILED CAS PDF into a `CASData`.
+
+    Every line of every page (from `extract_pages`) is classified, in this
+    order: statement period, AMC header, folio header, scheme header,
+    labeled rows (opening/closing balance, NAV, valuation, cost value,
+    nominees) and finally transaction rows. The most recent AMC, folio
+    and scheme are carried along as state, so statement order matters.
+
+    Column positions come from the transaction-table header detected on
+    each page; a page without a header reuses the columns of the previous
+    page that had one.
+
+    :param pdf_path: Passed to `extract_pages` and
+        `extract_cams_kfin_investor`.
+    :param password: Passed to the same two calls.
+    :param file_type: Stored unchanged on the returned `CASData`.
+    :param _doc: Forwarded as `_doc` to both extraction calls.
+    :return: `CASData` with `cas_type=CASFileType.DETAILED`.
+    """
+    pages = extract_pages(pdf_path, password, _doc=_doc)
+
+    statement_period: Optional[StatementPeriod] = None
+    folios: dict[str, Folio] = {}
+    current_amc: Optional[str] = None
+    current_folio: Optional[Folio] = None
+    current_scheme: Optional[Scheme] = None
+    last_columns: List[Column] = []  # inherited if current page lacks header
+
+    for page in pages:
+        header_pos = detect_txn_columns(page.lines, 0)
+        if header_pos:
+            header_idx, columns = header_pos
+            last_columns = columns
+        else:
+            # Continuation page — no header. Inherit from previous.
+            # header_idx=-1 means transactions can start from line 0.
+            header_idx = -1
+            columns = last_columns
+
+        for i, line in enumerate(page.lines):
+            text = line.text
+
+            # --- statement period (first match wins; every line is
+            #     checked until one is found) ---
+            if statement_period is None:
+                if m := STMT_PERIOD_RE.search(text):
+                    statement_period = StatementPeriod(from_=m.group(1), to=m.group(2))
+
+            # --- AMC ---
+            if m := AMC_RE.match(text.strip()):
+                current_amc = m.group(0)
+                continue
+
+            # --- Folio header ---
+            if "Folio No" in text and (m := FOLIO_LINE_RE.search(text)):
+                # Preserve internal " / " for compatibility with production
+                # parser output format (it keeps "12124203 / 63" style).
+                folio_no = m.group(1).strip()
+                if folio_no not in folios:
+                    folios[folio_no] = Folio(
+                        folio=folio_no,
+                        amc=current_amc or "UNKNOWN",
+                        PAN=m.group(2) or "",
+                        KYC=m.group(3) or None,
+                        PANKYC=m.group(4) or None,
+                        schemes=[],
+                    )
+                current_folio = folios[folio_no]
+                # A new folio header ends the previous scheme's context.
+                current_scheme = None
+                continue
+
+            # --- Scheme header ---
+            # The scheme block can span up to 3 baselines depending on AMC
+            # and statement template:
+            #
+            #   Older CAMS:                            Newer CAMS:
+            #   <code>-<name> ... Registrar : CAMS    Registrar :
+            #   WEALTH)                                <code>-<name> ... (Advisor:...)
+            #                                          KFINTECH
+            #
+            # We stitch up to 2 lines above and 2 lines below the
+            # current line (within Y_BAND pts y-distance) if those
+            # adjacent lines contain Registrar / Advisor / ISIN markers
+            # or look like the standalone RTA value (CAMS / KFINTECH).
+            Y_BAND = 5.0
+            if current_folio is not None and "-" in text:
+                parts_above = []
+                parts_below = []
+                base_y = page.lines[i].baseline
+                for offset in (1, 2):
+                    j = i - offset
+                    if j < 0:
+                        break
+                    if page.lines[j].baseline - base_y > Y_BAND:
+                        break
+                    t_above = page.lines[j].text.strip()
+                    if re.fullmatch(r"Registrar\s*:?", t_above, re.I) or re.search(
+                        r"Registrar\s*:|Advisor\s*:|ISIN\s*:", t_above, re.I
+                    ):
+                        parts_above.insert(0, t_above)
+                # When the scheme line ENDS with an incomplete trailing
+                # marker (e.g. "(Advisor: Registrar :"), take the next
+                # baseline below as the value continuation regardless of
+                # its content — the value tokens (ARN-XYZ, INAxxxxx,
+                # CAMS, KFINTECH) don't all match a fixed pattern.
+                trailing_incomplete = bool(
+                    re.search(
+                        r"(Registrar\s*:|Advisor\s*:|ISIN\s*:|\(\s*Advisor\s*:)\s*$",
+                        text.strip(),
+                        re.I,
+                    )
+                )
+                for offset in (1, 2):
+                    j = i + offset
+                    if j >= len(page.lines):
+                        break
+                    if base_y - page.lines[j].baseline > Y_BAND:
+                        break
+                    t_below = page.lines[j].text.strip()
+                    if (
+                        re.fullmatch(r"(CAMS|KFINTECH|KFIN)\)?", t_below, re.I)
+                        or re.search(r"Registrar\s*:|Advisor\s*:|ISIN\s*:", t_below, re.I)
+                        or (offset == 1 and trailing_incomplete)
+                    ):
+                        parts_below.append(t_below)
+                # Scheme line FIRST so SCHEME_HEAD_RE can anchor to `<code>-`.
+                # Then append annotations from any direction.
+                scheme_text = " ".join([text.strip()] + parts_above + parts_below)
+                # Trailing "Registrar :" with value already on the next
+                # token after stitching → ensure value present.
+                if scheme_text.endswith("Registrar :") or scheme_text.endswith("Registrar:"):
+                    if i + 1 < len(page.lines):
+                        toks = page.lines[i + 1].text.split()
+                        if toks:
+                            scheme_text = scheme_text + " " + toks[0]
+                if "Registrar" in scheme_text and (m := SCHEME_HEAD_RE.match(scheme_text)):
+                    code = m.group("code").strip()
+                    raw_name = m.group("name")
+                    # Pull `(Advisor: …)` and `- ISIN: …` out of name
+                    # (templates emit them in either order). Capture
+                    # values first, then `re.sub` both fragments so we
+                    # don't have to track shifted span offsets.
+                    isin_m = INLINE_ISIN_RE.search(raw_name)
+                    inline_isin = isin_m.group(1).strip() if isin_m else None
+                    adv_m = INLINE_ADVISOR_RE.search(raw_name)
+                    advisor = adv_m.group(1).strip() if adv_m else None
+                    raw_name = INLINE_ISIN_RE.sub("", raw_name)
+                    raw_name = INLINE_ADVISOR_RE.sub("", raw_name)
+                    name = get_parsed_scheme_name(raw_name)
+                    # Falls back to "CAMS" if the captured registrar is blank.
+                    rta = (m.group("rta") or "").strip() or "CAMS"
+                    isin, amfi, scheme_type = isin_search(
+                        name,
+                        rta,
+                        code,
+                        isin=inline_isin,
+                    )
+                    # Balances and valuation start as placeholders; the
+                    # labeled rows that follow overwrite them.
+                    current_scheme = Scheme(
+                        scheme=name,
+                        advisor=advisor,
+                        rta=rta,
+                        rta_code=code,
+                        isin=isin,
+                        amfi=amfi,
+                        type=scheme_type or "N/A",
+                        open=Decimal(0),
+                        close=Decimal(0),
+                        close_calculated=Decimal(0),
+                        valuation=SchemeValuation(
+                            date=statement_period.to if statement_period else "1970-01-01",
+                            nav=Decimal(0),
+                            value=Decimal(0),
+                        ),
+                        transactions=[],
+                    )
+                    current_folio.schemes.append(current_scheme)
+                    continue
+
+            # Everything below needs a scheme to attach data to.
+            if current_scheme is None:
+                continue
+
+            # --- Labeled rows ---
+            if m := OPEN_BAL_RE.search(text):
+                current_scheme.open = _decimal(m.group(1)) or Decimal(0)
+                # The running balance starts from the opening balance.
+                current_scheme.close_calculated = current_scheme.open
+                continue
+            # No `continue` after the checks below, so the remaining label
+            # patterns (and the transaction check) still see this line.
+            if m := CLOSE_BAL_RE.search(text):
+                current_scheme.close = _decimal(m.group(1)) or Decimal(0)
+            if m := NAV_RE.search(text):
+                current_scheme.valuation.date = dateparse.parse(m.group(1)).date()
+                current_scheme.valuation.nav = _decimal(m.group(2)) or Decimal(0)
+            if m := VALUATION_RE.search(text):
+                current_scheme.valuation.date = dateparse.parse(m.group(1)).date()
+                current_scheme.valuation.value = _decimal(m.group(2)) or Decimal(0)
+            if m := COST_VALUE_RE.search(text):
+                current_scheme.valuation.cost = _decimal(m.group(1))
+            if m := NOMINEE_RE.search(text):
+                noms = [
+                    (m.group("n1") or "").strip(),
+                    (m.group("n2") or "").strip(),
+                    (m.group("n3") or "").strip(),
+                ]
+                current_scheme.nominees = [n for n in noms if n]
+
+            # --- Transaction row (only when we have columns AND we're past
+            #     the header block on this page) ---
+            # `header_idx` is always an int here (-1 on continuation
+            # pages), so the `is not None` test never filters anything.
+            if columns and header_idx is not None and i > header_idx:
+                cells = assign_cells(line, columns)
+                date_str = cells.get("Date", "").strip()
+                desc = cells.get("Transaction", "").strip()
+                m_date = DATE_CELL_RE.match(date_str)
+                if not m_date:
+                    continue
+                if not desc:
+                    continue  # row with date but no description: skip
+                date_str = m_date.group(1)
+                # Normalize: collapse runs of dashes/spaces from overlay
+                # bleed-through, e.g. "15--Jan--2021" -> "15-Jan-2021".
+                date_str = re.sub(r"[-\s]+", "-", date_str).strip("-")
+                amt = _decimal(cells.get("Amount", ""))
+                units = _decimal(cells.get("Units", ""))
+                nav = _decimal(cells.get("Price", "") or cells.get("NAV", ""))
+                bal = _decimal(cells.get("Unit Balance", ""))
+                # A row with no amount AND no units is not a real transaction
+                # (usually a stray date in a footnote like "Effective from
+                # 01-Apr-2019…"). Skip these.
+                if amt is None and units is None:
+                    continue
+                # Some older CAMS / KFin templates omit the per-row Price
+                # column for transactions but always carry Amount + Units.
+                # Derive `nav = amount / units` so downstream capital-gains
+                # FIFO calculations don't crash on `nav=None`.
+                if nav is None and amt is not None and units is not None and units != 0:
+                    nav = (amt / units).quantize(Decimal("0.0001"))
+                txn_type, dividend_rate = get_transaction_type(desc, units)
+                if units is not None:
+                    current_scheme.close_calculated += units
+                current_scheme.transactions.append(
+                    TransactionData(
+                        date=dateparse.parse(date_str).date(),
+                        description=desc,
+                        amount=amt,
+                        units=units,
+                        nav=nav,
+                        balance=bal,
+                        type=txn_type.name,
+                        dividend_rate=dividend_rate,
+                    )
+                )
+
+    return CASData(
+        statement_period=statement_period or StatementPeriod(**{"from": "", "to": ""}),
+        folios=list(folios.values()),
+        investor_info=extract_cams_kfin_investor(pdf_path, password, _doc=_doc),
+        cas_type=CASFileType.DETAILED,
+        file_type=file_type,
+    )
diff --git a/casparser/parsers/cams_summary.py b/casparser/parsers/cams_summary.py
new file mode 100644
index 0000000..7495547
--- /dev/null
+++ b/casparser/parsers/cams_summary.py
@@ -0,0 +1,436 @@
+"""POC: CAMS/KFin SUMMARY CAS parser using column-based row reading.
+
+Same architecture as `cams_detailed`, simpler schema — each scheme is
+ONE row (no transactions). Schemes can wrap to one or two continuation
+lines below for long names.
+
+Row anatomy (CAMS, single line where possible):
+  <folio> <ISIN> <rta_code>-<scheme name> <cost> <balance> <NAV date>
+  <NAV> <market value> <RTA>
+
+KFin uses the same fields but renders the header across 2-3 baselines
+("Cost Value | Closing Unit Balance | Price | Market Value" on top,
+"Folio No. | ISIN | Scheme Name | NAV Date" below).
+
+Produces the same `CASData` shape as `cams_detailed.parse` so output
+can be diffed directly against production `casparser.read_cas_pdf`.
+"""
+
+from __future__ import annotations
+
+import re
+from decimal import Decimal
+from typing import List, Optional
+
+from dateutil import parser as dateparse
+
+from casparser.enums import CASFileType, FileType
+from casparser.types import (
+    CASData,
+    Folio,
+    Scheme,
+    SchemeValuation,
+    StatementPeriod,
+)
+
+from ._investor import extract_cams_kfin_investor
+from ._isin import isin_search
+from .cams_detailed import AMC_RE, Column, _decimal
+from .extract import Char, Line, extract_pages
+
+# -----------------------------------------------------------------------------
+# Column anchors
+# -----------------------------------------------------------------------------
+
+# Header keywords used by both CAMS and KFin SUMMARY templates. We accept
+# either dialect ("Unit Balance" / "Closing Unit Balance" for the units
+# column, "NAV" / "Price" for per-unit value). Whichever label appears in
+# the header row, we map it to a canonical column key.
+SUMMARY_HEADER_LABELS = {
+    "Folio",
+    "No",
+    "No.",
+    "ISIN",
+    "Scheme",
+    "Name",
+    "Cost",
+    "Value",
+    "Unit",
+    "Balance",
+    "Closing",
+    "NAV",
+    "Date",
+    "Price",
+    "Market",
+    "Registrar",
+}
+# 5 distinct header words to call it a header block. `detect_summary_columns`
+# additionally insists that "Folio" and "Scheme" are among them.
+SUMMARY_MIN_HITS = 5
+
+HEADER_WINDOW_Y = 15.0  # same as DETAILED — header may span up to ~15pt y
+
+# Column identity rules. Given the SET of words within one x-cluster of
+# the header (across all baselines), pick the canonical column whose
+# required tokens are all present. Tried in priority order — the first
+# match wins, skipping rules whose canonical label was already assigned
+# to an earlier cluster. Some clusters have noise tokens like "(INR)"
+# which we just ignore. Order of words within a cluster doesn't matter,
+# which matters for KFin: it renders "Closing" + "Unit" on one baseline
+# above "Balance" on another, and when sorted by x they come out
+# interleaved.
+# NOTE: the "optional tokens" entry is informational only —
+# `_build_summary_columns` tests the required set and nothing else.
+COLUMN_RULES = [
+    # (required tokens, optional tokens, canonical label, alignment)
+    ({"Folio"}, {"No.", "No"}, "Folio", "left"),
+    ({"ISIN"}, set(), "ISIN", "left"),
+    ({"Scheme"}, {"Name"}, "Scheme", "left"),
+    ({"Cost"}, {"Value"}, "Cost", "right"),
+    ({"Closing", "Balance"}, {"Unit"}, "Balance", "right"),
+    ({"Unit", "Balance"}, set(), "Balance", "right"),
+    ({"NAV", "Date"}, set(), "NAVDate", "left"),
+    ({"NAV"}, {"Value"}, "NAV", "right"),
+    ({"Price"}, set(), "NAV", "right"),
+    ({"Market"}, {"Value"}, "MarketValue", "right"),
+    ({"Registrar"}, set(), "Registrar", "left"),
+]
+
+# Cluster break threshold (pts): a word whose x0 lies more than this far
+# to the right of the current cluster's right edge (words sorted by x,
+# across all header baselines) starts a new cluster. KFin's headers have
+# legitimate column separators as tight as ~9pt (Market → Registrar), so
+# the threshold has to stay below that.
+XCLUSTER_GAP = 7.0
+
+
+def _words_on_line(line: Line, min_gap: float = 1.5) -> List[tuple[str, float, float]]:
+    """Group a line's chars into `[(text, x0, x1)]` words.
+
+    A word ends at a whitespace char (which is itself discarded) or when
+    the x-gap to the next char exceeds `min_gap`. The whitespace rule is
+    needed because the CAMS SUMMARY header inserts an actual ' ' Char
+    between "Folio" and "No.", so x-gap alone won't separate them.
+    """
+    words = []
+    buf = ""
+    start = end = None
+    for ch in sorted(line.chars, key=lambda c: c.x0):
+        blank = ch.text.isspace()
+        # Either kind of boundary closes the word collected so far.
+        if buf and (blank or ch.x0 - end > min_gap):
+            words.append((buf, start, end))
+            buf = ""
+        if blank:
+            continue
+        if not buf:
+            start = ch.x0
+        buf = buf + ch.text
+        end = ch.x1
+    if buf:
+        words.append((buf, start, end))
+    return words
+
+
+def detect_summary_columns(lines: List[Line], start_idx: int) -> Optional[tuple[int, List[Column]]]:
+    """Locate the SUMMARY table header at or after `start_idx`.
+
+    Uses the same window approach as DETAILED: starting from each
+    candidate line, following lines are pooled while their baseline stays
+    within HEADER_WINDOW_Y pts of the first one. The window is accepted
+    when its words contain at least SUMMARY_MIN_HITS distinct header
+    keywords, including both "Folio" and "Scheme".
+
+    Returns `(index_of_last_line_in_header, ordered columns)`, or `None`
+    when no window qualifies.
+    """
+    total = len(lines)
+    for top in range(start_idx, total):
+        top_y = lines[top].baseline
+        # `end` is one past the last line that still belongs to the window.
+        end = top + 1
+        while end < total and not (top_y - lines[end].baseline > HEADER_WINDOW_Y):
+            end += 1
+
+        header_words: List[tuple[str, float, float]] = [
+            word for ln in lines[top:end] for word in _words_on_line(ln)
+        ]
+        hits = {text for text, _, _ in header_words if text in SUMMARY_HEADER_LABELS}
+        if len(hits) < SUMMARY_MIN_HITS:
+            continue
+        if "Folio" in hits and "Scheme" in hits:
+            return end - 1, _build_summary_columns(header_words)
+    return None
+
+
+def _build_summary_columns(words: List[tuple[str, float, float]]) -> List[Column]:
+    """Derive canonical `Column`s from the pooled header words.
+
+    Step 1 clusters the words by x-proximity across all baselines: words
+    are taken in ascending `x0`, and a word whose `x0` is more than
+    XCLUSTER_GAP beyond the cluster's right-most `x1` opens a new cluster.
+
+    Step 2 gives each cluster the first COLUMN_RULES entry whose required
+    tokens are all present and whose label has not been used yet. Word
+    order inside a cluster is irrelevant — KFin splits "Closing Unit
+    Balance" across baselines so the x-sorted order interleaves to
+    "Closing Balance Unit". Clusters matching no rule are dropped.
+
+    The result is sorted by `x_lo`.
+    """
+    groups: List[List[tuple[str, float, float]]] = []
+    right_edge = 0.0
+    for word in sorted(words, key=lambda w: w[1]):
+        if not groups or word[1] - right_edge > XCLUSTER_GAP:
+            groups.append([])
+            right_edge = 0.0
+        groups[-1].append(word)
+        right_edge = max(right_edge, word[2])
+
+    cols: List[Column] = []
+    taken: set[str] = set()
+    for group in groups:
+        tokens = {w[0] for w in group}
+        chosen = next(
+            (
+                (label, align)
+                for required, _optional, label, align in COLUMN_RULES
+                if required.issubset(tokens) and label not in taken
+            ),
+            None,
+        )
+        if chosen is None:
+            continue
+        label, align = chosen
+        left = min(w[1] for w in group)
+        right = max(w[2] for w in group)
+        cols.append(Column(label=label, x_lo=left, x_hi=right, alignment=align))
+        taken.add(label)
+    cols.sort(key=lambda c: c.x_lo)
+    return cols
+
+
+# -----------------------------------------------------------------------------
+# Cell assignment (SUMMARY-specific zones)
+# -----------------------------------------------------------------------------
+
+# Numeric value widths in SUMMARY are narrower than DETAILED (cost/value
+# rarely exceed 13 chars). NAVDate values such as `01-Jan-2015` run past
+# the right end of the "NAV Date" label, so `_summary_column_ranges`
+# zones that column like any other left-aligned one.
+
+NUMERIC_WIDTH = 42.0  # pts; widest expected numeric value in SUMMARY
+
+
+def _summary_column_ranges(columns: List[Column]) -> List[tuple[Column, float, float]]:
+    """Derive the `(column, lo, hi)` x-zone of every column.
+
+    Columns are ordered by the midpoint of their header label. A
+    RIGHT-aligned numeric owns `x_hi - NUMERIC_WIDTH` up to `x_hi + 3`.
+    Any other column (e.g. NAVDate, whose `01-Jan-2015` value outruns
+    the `NAV Date` header label) starts at `x_lo - 3` and ends where
+    the next column's zone starts, or at infinity when it is last.
+    """
+
+    def zone_start(col: Column) -> float:
+        # Left boundary of a column's zone; doubles as the upper bound
+        # of a left-aligned neighbour sitting immediately before it.
+        return col.x_hi - NUMERIC_WIDTH if col.alignment == "right" else col.x_lo - 3.0
+
+    ordered = sorted(columns, key=lambda col: (col.x_lo + col.x_hi) / 2)
+    zones = []
+    for pos, col in enumerate(ordered):
+        if col.alignment == "right":
+            upper = col.x_hi + 3.0
+        else:
+            following = ordered[pos + 1 : pos + 2]
+            upper = zone_start(following[0]) if following else float("inf")
+        zones.append((col, zone_start(col), upper))
+    return zones
+
+
+def assign_summary_cells(line: Line, columns: List[Column]) -> dict[str, str]:
+    """Bucket the line's chars into column zones (by x-midpoint) and join
+    each non-empty bucket into text, adding a space at every wide gap."""
+    zones = _summary_column_ranges(columns)
+    buckets: dict[str, list[Char]] = {col.label: [] for col in columns}
+    for glyph in line.chars:
+        centre = (glyph.x0 + glyph.x1) / 2
+        owner = next((col for col, lo, hi in zones if lo <= centre < hi), None)
+        if owner is not None:
+            buckets[owner.label].append(glyph)
+    texts = {}
+    for label, glyphs in buckets.items():
+        if glyphs:
+            glyphs.sort(key=lambda g: g.x0)
+            median_h = sorted(g.h for g in glyphs)[len(glyphs) // 2]
+            # A space goes wherever neighbours sit further apart than
+            # 60% of the median glyph height (never less than 1.5).
+            threshold = max(1.5, 0.6 * median_h)
+            parts = [glyphs[0].text]
+            for left, right in zip(glyphs, glyphs[1:]):
+                if (right.x0 - left.x1) > threshold:
+                    parts.append(" ")
+                parts.append(right.text)
+            texts[label] = "".join(parts).strip()
+    return texts
+
+
+# -----------------------------------------------------------------------------
+# Parsing
+# -----------------------------------------------------------------------------
+
+# Folio must have ≥6 digits — short numbers like '0' or '11' in
+# disclaimer text aren't real folio numbers. Sub-account "/N" is
+# optional.
+FOLIO_CELL_RE = re.compile(r"^\s*(\d{6,}(?:\s*/\s*\d+)?)")
+ISIN_CELL_RE = re.compile(r"(INF[A-Z0-9]{8}\d)")
+SUMMARY_DATE_RE = re.compile(r"as\s+on\s+(\d{2}-[A-Za-z]{3}-\d{4})", re.I)
+# Scheme cell: looks like "<RTA_CODE>-<scheme name>". RTA code is 2-15
+# word chars (internal spaces allowed), then dash, then more text.
+SCHEME_CELL_RE = re.compile(r"^\s*([\w\s]{2,15}?)\s*-\s*(.+)$")
+# Scheme cell looks like data when it starts with an alphanumeric RTA
+# code (letters or digits, ≤16 chars incl. internal space), then a dash,
+# then the scheme name. Examples: "D110 - DSP...", "117 IOD1G-Mirae...",
+# "PP001ZG-Parag...". Disclaimer rows lack this exact prefix shape.
+SCHEME_LOOKS_LIKE_DATA = re.compile(r"^\s*[A-Z0-9][\w\s]{1,15}\s*-\s*\S")
+
+
+def parse(  # SUMMARY-statement PDF -> CASData (one Scheme per main table row)
+    pdf_path: str,
+    password: str,
+    file_type: FileType = FileType.UNKNOWN,
+    *,
+    _doc=None,  # optional pre-opened document, forwarded to the extractors
+) -> CASData:
+    pages = extract_pages(pdf_path, password, _doc=_doc)
+
+    statement_date: Optional[str] = None
+    folios: dict[str, Folio] = {}  # keyed by folio number, in first-seen order
+    current_amc: Optional[str] = None
+    current_folio: Optional[Folio] = None
+    current_scheme: Optional[Scheme] = None
+    last_columns: List[Column] = []  # layout of the most recent page that had a header
+
+    for page in pages:
+        header_pos = detect_summary_columns(page.lines, 0)
+        if header_pos:
+            header_idx, columns = header_pos
+            last_columns = columns
+        else:
+            header_idx = -1  # no header on this page: every line is eligible
+            columns = last_columns  # reuse the layout found on an earlier page
+
+        for i, line in enumerate(page.lines):
+            text = line.text
+
+            # --- statement date (single date for SUMMARY) ---
+            if statement_date is None:
+                if m := SUMMARY_DATE_RE.search(text):
+                    statement_date = m.group(1)
+
+            # --- AMC header (between groups of folios) ---
+            if m := AMC_RE.match(text.strip()):
+                current_amc = m.group(0)
+                continue
+
+            if not columns or header_idx is None or i <= header_idx:  # no layout / not past header
+                continue
+
+            cells = assign_summary_cells(line, columns)
+            folio_cell = cells.get("Folio", "").strip()
+            # Some PDFs have folio "/0" suffix overflowing into the ISIN
+            # column. Folios can also bleed into ISIN if very long. Use
+            # the cell text as a hint and pull the ISIN by regex.
+            isin_raw = cells.get("ISIN", "").strip()
+            m_isin = ISIN_CELL_RE.search(isin_raw) or ISIN_CELL_RE.search(folio_cell)
+            isin_cell = m_isin.group(1) if m_isin else ""
+            # If folio was truncated because of "/0" overflow, recover
+            # by taking the leading folio pattern. If no match, the cell
+            # holds non-folio text (disclaimer / wrapped scheme name) —
+            # clear it so we don't treat the row as a main row.
+            m_folio = FOLIO_CELL_RE.match(folio_cell)
+            folio_cell = m_folio.group(1).strip() if m_folio else ""
+            scheme_cell = cells.get("Scheme", "").strip()
+            balance_cell = cells.get("Balance", "").strip()
+            nav_date_cell = cells.get("NAVDate", "").strip()
+            nav_cell = cells.get("NAV", "").strip()
+            value_cell = cells.get("MarketValue", "").strip()
+            cost_cell = cells.get("Cost", "").strip()
+            rta_cell = cells.get("Registrar", "").strip()
+
+            # A "main" row is one that has BOTH a folio number AND a
+            # scheme name that looks like "<RTA_CODE>-<name>". This
+            # rejects disclaimer/footer text that happens to land
+            # partly in the folio or scheme x-zones.
+            is_main = (
+                bool(folio_cell)
+                and bool(scheme_cell)
+                and bool(SCHEME_LOOKS_LIKE_DATA.match(scheme_cell))
+            )
+            is_continuation = (  # wrapped scheme name: only the Scheme zone has text
+                current_scheme is not None
+                and not folio_cell
+                and scheme_cell
+                and not nav_date_cell
+                and not balance_cell
+            )
+
+            if is_main:
+                # Finalise previous scheme implicitly (it stays in its folio).
+                folio_no = folio_cell.strip()
+                if folio_no not in folios:
+                    folios[folio_no] = Folio(
+                        folio=folio_no,
+                        amc=current_amc or "UNKNOWN",
+                        PAN="",
+                        KYC=None,
+                        PANKYC=None,
+                        schemes=[],
+                    )
+                current_folio = folios[folio_no]
+
+                # Split rta_code from scheme name: "D110-DSP ELSS..." →
+                # code=D110, name=DSP ELSS...
+                code = ""
+                name = scheme_cell
+                if m := SCHEME_CELL_RE.match(scheme_cell):
+                    code = m.group(1).strip()
+                    name = m.group(2).strip()
+
+                balance = _decimal(balance_cell) or Decimal(0)  # falsy result -> 0
+                nav = _decimal(nav_cell) or Decimal(0)
+                cost = _decimal(cost_cell) if cost_cell else None  # empty Cost cell -> None
+                market_value = _decimal(value_cell) or Decimal(0)
+                isin = isin_cell or None
+
+                # NAV date — convert to a real `date` object so Pydantic
+                # doesn't try to coerce a `"01-Jan-2015"` string as if it
+                # were ISO-format (which mis-parses to year 201). Default
+                # to the statement date when the per-scheme NAV date cell
+                # is empty.
+                try:
+                    if nav_date_cell:
+                        nav_date = dateparse.parse(re.sub(r"[-\s]+", "-", nav_date_cell)).date()
+                    elif statement_date:
+                        nav_date = dateparse.parse(statement_date).date()
+                    else:
+                        nav_date = dateparse.parse("1970-01-01").date()
+                except Exception:  # any parse failure falls back to the 1970-01-01 sentinel
+                    nav_date = dateparse.parse("1970-01-01").date()
+
+                rta_for_lookup = rta_cell or "CAMS"  # empty Registrar cell falls back to "CAMS"
+                resolved_isin, amfi, scheme_type = isin_search(
+                    name,
+                    rta_for_lookup,
+                    code,
+                    isin=isin,
+                )
+                current_scheme = Scheme(
+                    scheme=name,
+                    advisor=None,
+                    rta=rta_for_lookup,
+                    rta_code=code,
+                    isin=resolved_isin or isin,
+                    amfi=amfi,
+                    type=scheme_type or "N/A",
+                    open=balance,  # the one Balance cell feeds open, close and close_calculated
+                    close=balance,
+                    close_calculated=balance,
+                    valuation=SchemeValuation(
+                        date=nav_date,
+                        nav=nav,
+                        value=market_value,
+                        cost=cost,
+                    ),
+                    transactions=[],
+                )
+                current_folio.schemes.append(current_scheme)
+                continue
+
+            if is_continuation:
+                # Append the wrap text to the previous scheme's name.
+                current_scheme.scheme = (current_scheme.scheme + " " + scheme_cell).strip()
+
+    return CASData(
+        statement_period=(
+            StatementPeriod(from_=statement_date, to=statement_date)  # single date: from == to
+            if statement_date
+            else StatementPeriod(**{"from": "", "to": ""})
+        ),
+        folios=list(folios.values()),
+        investor_info=extract_cams_kfin_investor(pdf_path, password, _doc=_doc),
+        cas_type=CASFileType.SUMMARY,
+        file_type=file_type,
+    )
diff --git a/casparser/parsers/cdsl.py b/casparser/parsers/cdsl.py
new file mode 100644
index 0000000..ae5dfb8
--- /dev/null
+++ b/casparser/parsers/cdsl.py
@@ -0,0 +1,576 @@
+"""Dedicated CDSL parser.
+
+Like `nsdl_parser`, this consumes structured `Block`/`Cell` data from
+`pageobj.extract_blocks` and emits an `NSDLCASData` directly — no
+detour through PROD's `process_cdsl_text`.
+
+CDSL CAS layout (in document order; absolute page numbers vary by
+holding count):
+
+  - **Cover + account roster** — investor address block followed by the
+    "Account Type / Account Details / ISINs / Value" summary table that
+    enumerates each demat account and the MF-folios pseudo-account.
+  - **Per-MF-folio descriptive blocks** — AMC Name, Scheme Name,
+    Folio No, KYC, ISIN/UCC/RTA, one block group per folio. No
+    balances here.
+  - **Per-account transaction sections + holdings tables** — each
+    section starts with `DP Name : <broker> ... BO ID :
+    <dpid+clientid>`, followed by transactions, then a
+    `HOLDING STATEMENT AS ON` header and the holdings table itself
+    (9-10 cells per row).
+  - **`MUTUAL FUND UNITS HELD AS ON` table** — one row per MF folio
+    with full P&L (scheme name, ISIN, folio, ARN code, units, NAV,
+    invested, current value, TER, commission, profit, return%).
+  - **Notes / footer** at the end.
+
+Some CDSL PDFs ship with a heavy Hindi-font overlay that makes
+roughly half the table cells unreadable by content-stream extraction
+(PROD fails on them too). The atom-level overlay filter in
+`extract.py` recovers most of these; the remainder need a smarter
+font-aware extractor and are out of scope here.
+"""
+
+from __future__ import annotations
+
+import re
+from decimal import Decimal, InvalidOperation
+from typing import Dict, List, Optional, Tuple
+
+from casparser.enums import FileType
+from casparser.types import (
+    DematAccount,
+    DematOwner,
+    Equity,
+    MutualFund,
+    NSDLCASData,
+    StatementPeriod,
+)
+
+from . import pageobj
+from ._investor import extract_nsdl_cdsl_investor
+from .pageobj import Block
+
+# --- patterns ---
+
+ISIN_RE = re.compile(r"^[A-Z]{2}[0-9A-Z]{9}\d$")
+INF_ISIN_RE = re.compile(r"^INF[0-9A-Z]{8}\d$")
+INE_ISIN_RE = re.compile(r"^IN[E9][0-9A-Z]{8}\d$")
+NUMERIC_RE = re.compile(r"^-?[\d,]+(?:\.\d+)?$")
+
+PERIOD_RE = re.compile(
+    r"(?:for\s+the\s+period\s+from|statement\s+for\s+the\s+period\s+from)\s+"
+    r"(\d{2}[-/][A-Za-z0-9]{2,3}[-/]\d{4})\s+to\s+(\d{2}[-/][A-Za-z0-9]{2,3}[-/]\d{4})",
+    re.I,
+)
+
+DEMAT_TYPE_RE = re.compile(r"^(CDSL|NSDL)\s+Demat\s+Account\s*$", re.I)
+PAN_RE = re.compile(r"(.+?)\s*\(\s*PAN\s*:\s*([^)]+?)\s*\)", re.I)
+
+# Page-2 summary row carries `DP Id: <dp> Client Id : <client>`
+# (whitespace around the colons varies).
+SUMMARY_DPC_RE = re.compile(
+    r"DP\s*Id\s*:\s*(\S+?)\s+Client\s*Id\s*:\s*(\d+)",
+    re.I,
+)
+# Per-account holdings header: `DP Name : <broker>  DP ID : <dp>
+# CLIENT ID : <client>`.
+SECTION_DPC_RE = re.compile(
+    r"DP\s*Name\s*:\s*(.+?)\s+DP\s*ID\s*:\s*(\S+)\s+CLIENT\s*ID\s*:\s*(\S+)",
+    re.I | re.S,
+)
+# Transaction-page header: `DP Name : <broker>  BO ID : <16-char id>`.
+# The id concatenates DP ID + Client ID, both 8 chars. CDSL DP IDs are
+# numeric, NSDL DP IDs start with `IN`, so the 16-char field can be all
+# digits (CDSL) or two letters + 14 digits (NSDL).
+SECTION_BOID_RE = re.compile(
+    r"DP\s*Name\s*:\s*(.+?)\s+(?:BO\s*ID|DPID)\s*:\s*([A-Z0-9]{16})",
+    re.I | re.S,
+)
+
+
+# --- decimal helpers ---
+
+
+def _to_decimal(text) -> Decimal:
+    """Cell text -> finite Decimal; blanks, placeholders, NaN/Inf and junk -> 0."""
+    s = "" if text is None else str(text).replace(",", "").strip()
+    if not s or s in ("-", "--", "N.A", "NA"):  # empty / "no value" markers
+        return Decimal(0)
+    try:
+        value = Decimal(s)
+    except InvalidOperation:
+        return Decimal(0)
+    return value if value.is_finite() else Decimal(0)  # "INF"/"NaN" parse but are not amounts
+
+
+def _opt_decimal(text) -> Optional[Decimal]:
+    """Cell text -> finite Decimal; blanks, placeholders, NaN/Inf and junk -> None."""
+    s = "" if text is None else str(text).replace(",", "").strip()
+    if not s or s in ("-", "--", "N.A", "NA"):  # empty / "no value" markers
+        return None
+    try:
+        value = Decimal(s)
+    except InvalidOperation:
+        return None
+    return value if value.is_finite() else None  # "INF"/"NaN" parse but are not amounts
+
+
+def _looks_numeric(text: str) -> bool:
+    """True when the stripped text is a plain number as defined by
+    NUMERIC_RE (optional minus, digits/commas, optional fraction)."""
+    candidate = text.strip()
+    return candidate != "" and NUMERIC_RE.match(candidate) is not None
+
+
+# --- account key utilities ---
+
+
+def _full_type(type_word: str) -> str:
+    return type_word.upper() + " Demat Account"  # e.g. "cdsl" -> "CDSL Demat Account"
+
+
+def _account_key(type_word: str, dp_id: str, client_id: str) -> Tuple[str, str, str]:
+    return type_word.upper(), dp_id.strip(), client_id.strip()  # (TYPE, dp id, client id)
+
+
+def _split_bo_id(bo_id: str) -> Tuple[str, str, str]:
+    """16-char BO ID → `(type_word, dp_id, client_id)`, or three empty
+    strings when the id has neither shape below.
+
+    NSDL: `IN` + 14 digits (input is upper-cased first, because the
+    section regex is case-insensitive). CDSL: 16 digits."""
+    bo_id = bo_id.upper()
+    if len(bo_id) != 16 or not (bo_id.isascii() and bo_id[2:].isdigit()):
+        return "", "", ""
+    if bo_id[:2] == "IN":
+        return "NSDL", bo_id[:8], bo_id[8:]
+    return ("CDSL", bo_id[:8], bo_id[8:]) if bo_id[:2].isdigit() else ("", "", "")
+
+
+# --- parser entry point ---
+
+
+def parse_cdsl(  # CDSL CAS PDF -> NSDLCASData, built in three passes over the blocks
+    pdf_path: str,
+    password: str,
+    file_type: FileType = FileType.CDSL,
+    *,
+    _doc=None,  # optional pre-opened document, forwarded to the atom extractor
+) -> NSDLCASData:
+    atoms = pageobj.extract_atoms(pdf_path, password, _doc=_doc)
+    blocks = pageobj.blocks_from_atoms(atoms)
+    period = _find_period(blocks) or StatementPeriod(**{"from": "", "to": ""})
+
+    # Phase 1: account roster from page 2 summary.
+    accounts_by_key: Dict[Tuple[str, str, str], DematAccount] = {}
+    ordered_accounts: List[DematAccount] = []
+    mf_folios_account: Optional[DematAccount] = None
+    pending_owners: List[DematOwner] = []
+
+    for b in blocks:
+        if b.page != 2:  # the roster is only looked for on page 2
+            continue
+        txt = b.text()
+        ltxt = txt.lower()
+        if "in the single name of" in ltxt or "in the joint name" in ltxt:
+            pending_owners = []  # an ownership heading starts a fresh owner list
+            continue
+        if PAN_RE.search(txt) and "Mutual" not in txt:
+            for m in PAN_RE.finditer(txt):
+                pending_owners.append(
+                    DematOwner(
+                        name=m.group(1).strip(),
+                        PAN=m.group(2).strip(),
+                    )
+                )
+            continue
+        if _is_summary_demat_row(b):
+            ac, key = _account_from_summary_row(b, pending_owners)
+            if key not in accounts_by_key:  # first row seen for a key wins
+                accounts_by_key[key] = ac
+                ordered_accounts.append(ac)
+            continue
+        if _is_summary_mf_folios_row(b):
+            if mf_folios_account is None:  # only the first MF-folios row is used
+                mf_folios_account = _mf_folios_account_from_summary(b, pending_owners)
+                ordered_accounts.append(mf_folios_account)
+            continue
+
+    # Phase 2: scheme-code → (ISIN, UCC, folio, name) map from the
+    # descriptive MF blocks that follow the roster page. Their page
+    # span depends on how many MF folios the investor holds; we
+    # bound-scan from page 3 up to the start of the per-account
+    # transaction section (detected via the `BO ID :` / `DPID :`
+    # marker), and only consume blocks that match the descriptive
+    # template (Scheme Name + Scheme Code + ISIN + UCC).
+    scheme_meta: Dict[str, Dict[str, str]] = {}
+    pending_scheme: Dict[str, str] = {}
+    for b in blocks:
+        if b.page < 3:
+            continue
+        if SECTION_BOID_RE.search(b.text()):  # first account section ends the scan
+            break
+        txt = b.text()
+        if "Scheme Name :" in txt and "Scheme Code :" in txt:
+            sm = re.search(
+                r"Scheme\s*Name\s*:\s*(.+?)\s+Scheme\s*Code\s*:\s*(\S+)",
+                txt,
+                re.S,
+            )
+            if sm:
+                pending_scheme = {  # starts a new entry, dropping any unfinished one
+                    "scheme_name": sm.group(1).replace("\n", " ").strip(),
+                    "scheme_code": sm.group(2).strip(),
+                }
+        elif "Folio No :" in txt:
+            fm = re.search(r"Folio\s*No\s*:\s*(\S+)", txt)
+            if fm:
+                pending_scheme["folio"] = fm.group(1)
+        elif "ISIN :" in txt and "UCC" in txt:
+            im = re.search(r"ISIN\s*:\s*(\S+)", txt)
+            um = re.search(r"UCC\s*:\s*([\w/]+)?", txt)
+            if im and pending_scheme.get("scheme_code"):
+                pending_scheme["isin"] = im.group(1)
+                if um and um.group(1):
+                    pending_scheme["ucc"] = um.group(1)
+                scheme_meta[pending_scheme["scheme_code"]] = dict(pending_scheme)
+                pending_scheme = {}  # the ISIN/UCC block completes the entry
+
+    # Phase 3: walk all post-cover pages for holdings tables.
+    # We skip pages 1-2 (cover + roster) because the roster lines
+    # contain CDSL/NSDL identifiers that would otherwise look like
+    # section headers; the dispatch logic below handles the rest.
+    cur_account: Optional[DematAccount] = None
+    cur_mode: Optional[str] = None  # 'equities' | 'mf_holdings'
+
+    for b in blocks:
+        if b.page < 3:
+            continue
+        txt = b.text()
+        ltxt = txt.lower()
+
+        # Per-account section header — `DP Name : ... BO ID : ...`
+        # or `DP Name : ... DPID : ...` (NSDL variant) form.
+        m = SECTION_BOID_RE.search(txt)
+        if m:
+            broker = m.group(1).strip()  # NOTE(review): assigned but not read below
+            bo_id = m.group(2)
+            type_word, dp_id, client_id = _split_bo_id(bo_id)
+            if type_word:  # an unrecognised id falls through to the checks below
+                ac_key = _account_key(type_word, dp_id, client_id)
+                cur_account = accounts_by_key.get(ac_key)  # None if not in the roster
+                cur_mode = None
+                continue
+
+        # Or "DP Name : ... DP ID : ... CLIENT ID : ..."
+        m = SECTION_DPC_RE.search(txt)
+        if m:
+            type_word = "CDSL"  # default; NSDL only when the text names NSDL and not CDSL
+            if "NSDL" in txt.upper() and "CDSL" not in txt.upper():
+                type_word = "NSDL"
+            broker, dp_id, client_id = m.groups()
+            ac_key = _account_key(type_word, dp_id.strip(), client_id.strip())
+            cur_account = accounts_by_key.get(ac_key)  # None if not in the roster
+            cur_mode = None
+            continue
+
+        # Transaction-statement section — switch OFF holdings mode so
+        # transaction rows aren't parsed as equity rows.
+        if "statement of transactions" in ltxt:
+            cur_mode = None
+            continue
+
+        # Holdings section markers
+        if "holding statement" in ltxt and "as on" in ltxt:
+            cur_mode = "equities"
+            continue
+        if "mutual fund units held as on" in ltxt:
+            cur_account = mf_folios_account  # may be None; rows are then skipped below
+            cur_mode = "mf_holdings"
+            continue
+
+        # Skip column-header rows
+        if _is_holdings_header(b) or _is_total_row(b):
+            continue
+
+        # Holdings rows
+        if cur_account is None or cur_mode is None:
+            continue
+        if cur_mode == "equities":
+            row = _parse_holdings_row(b)
+            if row is None:
+                pass  # block is not a holdings row; nothing to record
+            else:
+                isin, name, num_shares, price, value = row
+                # CDSL Demat statements list ETFs (ISIN starting with
+                # INF) in the same holdings table as equities, but
+                # they're semantically mutual-fund units. Route them
+                # to the mutual_funds list to mirror PROD's
+                # classification.
+                if INF_ISIN_RE.match(isin):
+                    cur_account.mutual_funds.append(
+                        MutualFund(
+                            name=name,
+                            isin=isin,
+                            balance=num_shares,
+                            nav=price,
+                            value=value,
+                        )
+                    )
+                else:
+                    cur_account.equities.append(
+                        Equity(
+                            name=name,
+                            isin=isin,
+                            num_shares=num_shares,
+                            price=price,
+                            value=value,
+                        )
+                    )
+        elif cur_mode == "mf_holdings":
+            mf = _parse_mf_holdings_row(b, scheme_meta)
+            if mf:
+                cur_account.mutual_funds.append(mf)
+
+    return NSDLCASData(
+        statement_period=period,
+        accounts=ordered_accounts,
+        investor_info=extract_nsdl_cdsl_investor(
+            pdf_path,
+            password,
+            _atoms=atoms,  # reuse the atoms extracted above
+        ),
+        file_type=file_type,
+    )
+
+
+# --- summary-row recognisers (page 2) ---
+
+
+def _is_summary_demat_row(block: Block) -> bool:
+    """Roster row test: exactly 4 cells, cell 0 matching DEMAT_TYPE_RE and
+    cell 1 containing a SUMMARY_DPC_RE `DP Id ... Client Id` pair."""
+    cells = block.cells
+    type_ok = len(cells) == 4 and DEMAT_TYPE_RE.match(cells[0].text.strip()) is not None
+    return type_ok and SUMMARY_DPC_RE.search(cells[1].text) is not None
+
+
+def _is_summary_mf_folios_row(block: Block) -> bool:
+    """Roster row test: 4 cells, the first starting with `Mutual Fund Folios`."""
+    label = block.cells[0].text.strip() if len(block.cells) == 4 else ""
+    return re.match(r"^Mutual\s+Fund\s+Folios", label, re.I) is not None
+
+
+def _account_from_summary_row(
+    block: Block, owners: List[DematOwner]
+) -> Tuple[DematAccount, Tuple[str, str, str]]:
+    """Build the `DematAccount` for one roster row, plus its lookup key.
+    Cell 0 names the depository, cell 1 holds the broker (first non-blank
+    line) and the `DP Id`/`Client Id` pair, cell 2 the count stored as
+    `folios`, cell 3 the balance. `owners` is copied, not shared."""
+    cells = block.cells
+    depository = DEMAT_TYPE_RE.match(cells[0].text.strip()).group(1).upper()
+    broker = next((ln.strip() for ln in cells[1].text.split("\n") if ln.strip()), "")
+    ids = SUMMARY_DPC_RE.search(cells[1].text)
+    dp_id, client_id = (ids.group(1), ids.group(2)) if ids else ("", "")
+    account = DematAccount(
+        name=broker,
+        type=_full_type(depository),
+        dp_id=dp_id,
+        client_id=client_id,
+        folios=int(_to_decimal(cells[2].text)),
+        balance=_to_decimal(cells[3].text),
+        owners=list(owners),
+        equities=[],
+        mutual_funds=[],
+    )
+    return account, _account_key(depository, dp_id, client_id)
+
+
+def _mf_folios_account_from_summary(block: Block, owners: List[DematOwner]) -> DematAccount:
+    """Pseudo-account for the roster's MF row: first integer in cell 1 is
+    the folio count (0 if none), cell 3 the balance; no DP/client id."""
+    digits = re.findall(r"\d+", block.cells[1].text)
+    return DematAccount(
+        name="Mutual Fund Folios",
+        type="Mutual Fund Folios",
+        dp_id="",
+        client_id="",
+        folios=int(digits[0]) if digits else 0,
+        balance=_to_decimal(block.cells[3].text),
+        owners=list(owners),
+        equities=[],
+        mutual_funds=[],
+    )
+
+
+# --- helpers ---
+
+
+def _find_period(blocks: List[Block]) -> Optional[StatementPeriod]:
+    """Statement period from the first block whose text matches PERIOD_RE."""
+    found = next(filter(None, (PERIOD_RE.search(b.text()) for b in blocks)), None)
+    if found is None:
+        return None
+    return StatementPeriod(**{"from": found.group(1), "to": found.group(2)})
+
+
+def _is_holdings_header(block: Block) -> bool:
+    """True for a column-label row: the text holds no INE/INF/IN9 ISIN
+    and names either ISIN plus security/scheme name, or the trio
+    current + bal + market (all matched case-insensitively)."""
+    raw = block.text()
+    if re.search(r"\b(IN[EF9][0-9A-Z]{8}\d)\b", raw, re.I) is not None:
+        return False
+    flat = raw.lower().replace("\n", " ").replace("\t\t", " ")
+    isin_labels = "isin" in flat and ("security" in flat or "scheme name" in flat)
+    balance_labels = all(word in flat for word in ("current", "bal", "market"))
+    return isin_labels or balance_labels
+
+
+def _is_total_row(block: Block) -> bool:
+    label = block.cells[0].text.strip().lower() if block.cells else ""
+    return label in {"sub total", "total", "grand total"}  # first cell is a totals caption
+
+
+# --- equity holdings row ---
+
+
+def _parse_holdings_row(block: Block) -> Optional[Tuple[str, str, Decimal, Decimal, Decimal]]:
+    """Decode one CDSL holdings row into `(isin, name, num_shares, price, value)`.
+
+    Expected columns (after `HOLDING STATEMENT`):
+      ISIN | Security | Current Bal | Frozen Bal | Pledge Bal |
+      Pledge Setup Bal | Free Bal | Market Price | Value (`)
+
+    Cell 0 must be an ISIN. The name is every cell between it and the
+    first cell that is numeric or a `-`/`--` placeholder; the renderer
+    may split a wrapped name over several cells, and a lone `@` marker
+    (suspended-issue notation) is dropped. That first data cell is the
+    share count; price and value are read by position from the last
+    two cells rather than by "last three numerics", because rows whose
+    balances are all `--` (unexercised rights entitlements) carry only
+    two real numbers. `_to_decimal` turns `--` into 0.
+
+    Returns `None` when the row has no cells, no leading ISIN, no data
+    cell, or fewer than three cells from the data cell onwards. The
+    name is `None` when no name cell has text."""
+    cells = block.cells
+    if not cells:
+        return None
+    isin = cells[0].text.strip()
+    if not ISIN_RE.match(isin):
+        return None
+
+    def is_data(text: str) -> bool:
+        return _looks_numeric(text) or text in ("--", "-")
+
+    data_start = next((i for i in range(1, len(cells)) if is_data(cells[i].text.strip())), None)
+    if data_start is None or len(cells) - data_start < 3:
+        return None
+
+    name_parts = []
+    for cell in cells[1:data_start]:
+        stripped = cell.text.strip()
+        if stripped and stripped != "@":
+            name_parts.append(cell.text.replace("\n", " ").strip())
+    name = " ".join(name_parts) or None
+
+    return (
+        isin,
+        name,
+        _to_decimal(cells[data_start].text),
+        _to_decimal(cells[-2].text),
+        _to_decimal(cells[-1].text),
+    )
+
+
+# --- MF holdings row (the `MUTUAL FUND UNITS HELD AS ON` section) ---
+
+
+def _parse_mf_holdings_row(
+    block: Block,
+    scheme_meta: Dict[str, Dict[str, str]],
+) -> Optional[MutualFund]:
+    """Decode one row of the `MUTUAL FUND UNITS HELD AS ON` table.
+
+    Known templates:
+
+    - **13 cells, with a distribution-mode column**:
+        name | ISIN | folio | ARN-or-DIRECT | units | NAV | invested
+        | value | TER% | direct | commission | profit | return%
+
+    - **7 cells, without it**:
+        name | ISIN | folio | units | NAV | invested | value
+
+    The ISIN is looked for in the first three cells; the cells before
+    it form the name and the cell after it is the folio. The cell two
+    past the ISIN tells the templates apart: a clean number is already
+    the units value (7-cell layout), anything else (`ARN-####`,
+    `DIRECT`, a folio-split fragment such as `4/0`) is taken as the
+    distribution-mode column (13-cell layout) and skipped.
+
+    From there on only numeric cells are kept, so units / NAV /
+    invested / value are the first four numbers even when a
+    split-folio quirk adds stray cells; value falls back to 0 when
+    only three numbers exist. In the 13-cell layout the last number
+    is read as return% (needs ≥5 numbers) and the one before it as
+    profit (needs ≥6). UCC is looked up in `scheme_meta` under the
+    `<CODE> -` prefix of the name.
+
+    Returns `None` for a row with fewer than 5 cells, no ISIN, or
+    fewer than 3 numeric cells.
+    """
+    cells = block.cells
+    if len(cells) < 5:
+        return None
+
+    # The ISIN usually sits in cell 1; cells 0-2 are the only candidates.
+    isin_idx = next(
+        (i for i, cell in enumerate(cells[:3]) if ISIN_RE.match(cell.text.strip())),
+        None,
+    )
+    if isin_idx is None:
+        return None
+    isin = cells[isin_idx].text.strip()
+
+    name_parts = [c.text.replace("\n", " ").strip() for c in cells[:isin_idx] if c.text.strip()]
+    name = " ".join(name_parts) or None
+
+    # With ≥5 cells and the ISIN at index ≤2, indices isin_idx + 1 and
+    # isin_idx + 2 always exist, so no bounds checks are needed here.
+    folio = cells[isin_idx + 1].text.strip() or None
+    has_distrib_col = not _looks_numeric(cells[isin_idx + 2].text)
+
+    first_value = isin_idx + 3 if has_distrib_col else isin_idx + 2
+    numerics = [c.text.strip() for c in cells[first_value:] if _looks_numeric(c.text)]
+    count = len(numerics)
+    if count < 3:
+        return None
+
+    pnl = ret = None
+    if has_distrib_col and count >= 6:
+        pnl = _opt_decimal(numerics[-2])
+    if has_distrib_col and count >= 5:
+        ret = _opt_decimal(numerics[-1])
+
+    # Scheme code = leading `[A-Z0-9]+` run before the first dash.
+    ucc = None
+    code_m = re.match(r"\s*([A-Z0-9]+)\s*-\s*", name) if name else None
+    if code_m:
+        ucc = (scheme_meta.get(code_m.group(1)) or {}).get("ucc")
+
+    # `return` is a Python keyword, so that field has to be passed
+    # through dict unpacking.
+    return MutualFund(
+        name=name,
+        isin=isin,
+        balance=_to_decimal(numerics[0]),
+        nav=_to_decimal(numerics[1]),
+        value=_to_decimal(numerics[3]) if count >= 4 else Decimal(0),
+        total_cost=_opt_decimal(numerics[2]),
+        ucc=ucc,
+        folio=folio,
+        pnl=pnl,
+        **{"return": ret},
+    )
diff --git a/casparser/parsers/detect.py b/casparser/parsers/detect.py
new file mode 100644
index 0000000..021d76f
--- /dev/null
+++ b/casparser/parsers/detect.py
@@ -0,0 +1,98 @@
+"""Detect the CAS issuer and statement variant from a PDF.
+
+We look at the first 1-2 pages of text for unambiguous source markers
+(CAMS / KFin watermark, NSDL / CDSL header strings) and the
+`Consolidated Account (Statement|Summary)` heading.
+
+All public functions accept an optional pre-opened `pdfium.PdfDocument`
+so the dispatcher can open the PDF exactly once per `read_cas_pdf`
+call. When `_doc` is `None`, the function falls back to opening from
+the path argument — keeping the path-based signature usable for
+direct calls (unit tests, third-party consumers).
+"""
+
+from __future__ import annotations
+
+import re
+from typing import Optional
+
+import pypdfium2 as pdfium
+from pypdfium2._helpers.misc import PdfiumError
+
+from casparser.enums import CASFileType, FileType
+from casparser.exceptions import CASParseError, IncorrectPasswordError
+
+_CAS_TYPE_RE = re.compile(
+    r"consolidated\s+account\s+(statement|summary)",  # group 1 names the variant
+    re.I,  # headings are matched case-insensitively
+)
+
+
+def _open_document(pdf_path, password) -> pdfium.PdfDocument:
+    """Open a PDF with pypdfium2, mapping its failures onto casparser exceptions."""
+    try:
+        return pdfium.PdfDocument(pdf_path, password=password)
+    except TypeError as exc:
+        raise CASParseError(f"Invalid input: {exc}") from exc
+    except PdfiumError as exc:
+        detail = str(exc)
+        # Upper-casing makes this a case-insensitive search for "password".
+        if "PASSWORD" in detail.upper():
+            raise IncorrectPasswordError("Incorrect PDF password!") from exc
+        raise CASParseError(f"Unhandled error while opening PDF: {detail}") from exc
+
+
+def _read_text_sample(
+    pdf_path,
+    password,
+    max_pages: int = 2,
+    *,
+    _doc: Optional[pdfium.PdfDocument] = None,
+) -> str:
+    """Extract text from the first `max_pages` pages; a PDF opened here is closed again."""
+    doc = _doc if _doc is not None else _open_document(pdf_path, password)
+    try:
+        # Index pages directly so the page at index `max_pages` is never loaded.
+        pages = (doc[i] for i in range(min(max_pages, len(doc))))
+        return "\n".join(pg.get_textpage().get_text_bounded() for pg in pages)
+    finally:
+        if _doc is None:  # only release a document this call opened itself
+            doc.close()
+
+
+def detect_file_type(
+    pdf_path,
+    password,
+    *,
+    _doc: Optional[pdfium.PdfDocument] = None,
+) -> FileType:
+    """Identify the issuer (CAMS / KFin / NSDL / CDSL) from the sampled page
+    text; `FileType.UNKNOWN` when no marker matches. Markers are tried in order."""
+    sample = _read_text_sample(pdf_path, password, _doc=_doc)
+    markers = (
+        ("CAMSCASWS", FileType.CAMS),
+        ("KFINCASWS", FileType.KFINTECH),
+        ("NSDL Consolidated Account Statement", FileType.NSDL),
+        ("About NSDL", FileType.NSDL),
+        ("Central Depository Services (India) Limited", FileType.CDSL),
+    )
+    hits = (kind for marker, kind in markers if marker in sample)
+    return next(hits, FileType.UNKNOWN)
+
+
+def detect_cas_type(
+    pdf_path,
+    password,
+    *,
+    _doc: Optional[pdfium.PdfDocument] = None,
+) -> CASFileType:
+    """Classify a CAMS / KFin CAS as SUMMARY or DETAILED from the first page's
+    heading; NSDL / CDSL have no such split. No heading found → UNKNOWN."""
+    first_page = _read_text_sample(pdf_path, password, max_pages=1, _doc=_doc)
+    heading = _CAS_TYPE_RE.search(first_page)
+    if heading is None:
+        return CASFileType.UNKNOWN
+    by_word = {"statement": CASFileType.DETAILED, "summary": CASFileType.SUMMARY}
+    # The pattern is case-insensitive, so normalise before the lookup.
+    word = heading.group(1).lower().strip()
+    return by_word.get(word, CASFileType.UNKNOWN)
diff --git a/casparser/parsers/extract.py b/casparser/parsers/extract.py
new file mode 100644
index 0000000..1c52362
--- /dev/null
+++ b/casparser/parsers/extract.py
@@ -0,0 +1,394 @@
+"""Atom-based PDF text extraction for CAMS/KFin parsers.
+
+Walks PDF page objects — one per text-show operation (an *atom*) — and
+emits per-glyph `Char`s grouped by their parent atom. Overlay
+duplicates (the KFin date-twin pattern) are filtered at the atom level,
+which removes the need for the per-character overlay heuristics earlier
+versions used.
+
+Why atom-based extraction
+=========================
+
+CAS PDFs occasionally render the date column as TWO near-identical
+glyph layers in the same font, offset by ~0.7pt vertically. With pure
+per-glyph extraction we lose track of which glyph belongs to which
+text-show op, so the two layers end up sharing one logical line and the
+chars interleave by x — `2020` reads back as `22002200`, dateutil
+parses it as year 2200, and downstream gains / CSV-export code consumes
+garbage.
+
+PyMuPDF and pdfminer.six handle this case naturally because their text
+APIs return whole *strings* (one per text-show op), not glyphs. Each
+overlay layer comes back as its own string and is easy to dedup. We can
+do the same with PDFium's page-object API (``FPDFPage_GetObject`` +
+``FPDFTextObj_GetText``) — each text object is one atom, the atom's
+text is the un-interleaved string, and we can drop one of two atoms
+that visually overlap in the same font.
+
+Why we still need per-glyph positions
+=====================================
+
+`cams_detailed.py` uses precise per-glyph x positions for the table
+column anchors. So after dedup at the atom level, we expand each
+surviving atom back into per-glyph `Char`s using ``FPDFText_*``. The
+`Char` / `Line` / `Page` shape stays identical to earlier versions, so
+the downstream parsers don't change.
+
+The char→atom mapping uses PDFium's own ``FPDFText_GetTextObject``,
+which returns the text page object that produced each char. This is
+authoritative — PDFium walks the textpage in reading order (not
+content-stream order), so naive cursor-based indexing fails.
+
+Why baseline y not bbox y
+=========================
+
+Per-char y still uses ``FPDFText_GetCharOrigin`` — the typographic
+baseline, not the bbox bottom which varies with descenders. This keeps
+dashes and `g`/`y`/`p` glyphs at the same y as the rest of their line.
+"""
+
+from __future__ import annotations
+
+import ctypes
+from dataclasses import dataclass, field
+from typing import List, Optional
+
+import pypdfium2 as pdfium
+import pypdfium2.raw as pdfium_raw
+
+# Per-line baseline-clustering tolerance (pts). With origin-based y,
+# glyphs from one text-show op share an exact baseline; 1.5pt absorbs
+# the small inter-atom drift you see between, e.g., a date atom and a
+# description atom on the same visual row, without merging genuinely
+# different rows that sit ~7pt+ apart.
+Y_TOL = 1.5
+
+# Row-clustering tolerance (pts) for the overlay dedup. Wider than
+# `Y_TOL` because we want both layers of an overlay pair (typically
+# ~0.7pt apart) AND the rest of the row's atoms to land in the same
+# row. The actual line clustering uses the tighter `Y_TOL`.
+Y_OVERLAY_ROW_TOL = 3.0
+
+# Minimum y-offset (pts) between two same-font atoms before we treat
+# them as candidates for being an overlay pair. Zero would mean "same
+# physical row" — those are legitimate side-by-side cells, not overlays.
+Y_OVERLAY_MIN_OFFSET = 0.05
+
+# Minimum x-overlap (as fraction of the narrower atom's width) required
+# for two same-font atoms to count as overlay duplicates rather than
+# just neighbouring columns.
+X_OVERLAY_MIN_FRAC = 0.5
+
+# Size in bytes (trailing NUL included) of the font-name lookup buffer.
+_FONT_BUF_SIZE = 128
+
+# Fonts we drop wholesale. Mangal is the Devanagari font NSDL/CDSL CAS
+# files use to overlay Hindi translations on top of English text;
+# discarding it at extraction time keeps line clustering clean.
+_NON_LATIN_FONT_KEYWORDS = ("Mangal",)
+
+
+# ---------------------------------------------------------------------- types
+
+
+@dataclass
+class Char:
+    """One glyph at a known typographic position."""
+
+    text: str
+    x0: float  # left edge of the glyph box
+    y0: float  # baseline (FPDFText_GetCharOrigin)
+    x1: float  # right edge of the glyph box
+    y1: float  # visual glyph top
+    font: str = ""  # owning atom's font name, subset prefix stripped
+
+    @property
+    def h(self) -> float:
+        return self.y1 - self.y0  # glyph top minus baseline
+
+
+@dataclass
+class Line:
+    page: int
+    baseline: float
+    chars: List[Char] = field(default_factory=list)
+
+    @property
+    def text(self) -> str:
+        """Render the line's chars left-to-right as one string.
+
+        A single space is inserted between neighbours whose x-gap is
+        larger than ``max(1.5, 0.6 × median char height)``; the 1.5pt
+        floor applies when the glyphs on the line are very short.
+        An empty line renders as ``""``.
+        """
+        ordered = sorted(self.chars, key=lambda c: c.x0)
+        if not ordered:
+            return ""
+        # Upper median of the glyph heights drives the gap threshold.
+        median_h = sorted(c.h for c in ordered)[len(ordered) // 2]
+        threshold = max(1.5, 0.6 * median_h)
+        pieces = [ordered[0].text]
+        # Compare every char with its immediate left neighbour.
+        for left, right in zip(ordered, ordered[1:]):
+            if (right.x0 - left.x1) > threshold:
+                pieces.append(" ")
+            pieces.append(right.text)
+        return "".join(pieces)
+
+
+@dataclass
+class Page:
+    number: int  # 1-based page number (see `extract_pages`)
+    lines: List[Line]  # baseline-clustered lines for this page
+
+
+@dataclass
+class _Atom:
+    """One PDF text-show op, with its bbox, font, and the glyphs it emitted.
+
+    Internal to this module — `extract_pages` returns `Page`/`Line`/`Char`
+    so downstream parsers don't have to know about the atom layer.
+    """
+
+    x_left: float  # bbox left edge (from FPDFPageObj_GetBounds)
+    x_right: float  # bbox right edge
+    y_top: float  # bbox top edge; the overlay dedup compares this
+    y_bot: float  # bbox bottom edge
+    font: str  # base font name with the subset prefix stripped
+    chars: List[Char] = field(default_factory=list)  # glyphs PDFium maps to this op
+
+    @property
+    def width(self) -> float:
+        return self.x_right - self.x_left  # horizontal bbox extent
+
+
+# ---------------------------------------------------------------------- helpers
+
+
+def _is_non_latin_font(font_name: str) -> bool:
+    """True when the name (subset prefix ignored) contains a dropped-font keyword."""
+    return any(kw in font_name[font_name.find("+") + 1 :] for kw in _NON_LATIN_FONT_KEYWORDS)
+
+
+def _strip_font_subset_prefix(name: str) -> str:
+    """Return `name` without a leading ``<tag>+`` subset prefix (everything up
+    to the first ``+``); a name containing no ``+`` comes back unchanged."""
+    return name.partition("+")[2] if "+" in name else name
+
+
+# ---------------------------------------------------------------------- API
+
+
+def extract_pages(
+    pdf_path: str,
+    password: str,
+    *,
+    _doc: "Optional[pdfium.PdfDocument]" = None,
+) -> List[Page]:
+    """Return one `Page` per PDF page, each holding baseline-clustered `Line`s
+    of `Char`s. A document opened here (no ``_doc`` supplied) is closed before
+    returning; a caller-supplied ``_doc`` is left open for the caller."""
+    doc = _doc if _doc is not None else pdfium.PdfDocument(pdf_path, password=password)
+    pages: List[Page] = []
+    try:
+        for page_num, page in enumerate(doc, start=1):
+            atoms = _dedupe_overlay_atoms(_walk_page_atoms(page))
+            pages.append(Page(number=page_num, lines=_cluster_into_lines(atoms, page_num)))
+        return pages
+    finally:
+        if _doc is None:  # we opened it, so we release it (result is plain Python data)
+            doc.close()
+
+
+# ---------------------------------------------------------------------- atom walk
+
+
+def _walk_page_atoms(page) -> List[_Atom]:
+    """Collect one `_Atom` (bbox, font, glyph `Char`s) per text object on `page`.
+
+    Chars are attached via ``FPDFText_GetTextObject(textpage, i)`` rather
+    than a cursor over the objects, because the textpage's char order is
+    not the page objects' stream order. Atoms with no kept chars are omitted.
+    NOTE(review): the font name is read into a `_FONT_BUF_SIZE`-byte buffer;
+    confirm what PDFium writes when a name is longer than that.
+    """
+    page_handle = page.raw
+    tp = page.get_textpage()
+    tp_handle = tp.raw
+
+    # 1. Index text page objects by an integer key derived from their
+    #    raw PDFium pointer (see `_obj_key`), so step 2 can map each
+    #    char to its atom with one dict lookup. Objects in a dropped
+    #    (non-Latin) font are stored as None so their chars are skipped.
+    #    The ctypes out-params below are reused across iterations.
+    n_objects = pdfium_raw.FPDFPage_CountObjects(page_handle)
+    font_buf = (ctypes.c_char * _FONT_BUF_SIZE)()
+    left = ctypes.c_float()
+    bottom = ctypes.c_float()
+    right = ctypes.c_float()
+    top = ctypes.c_float()
+
+    obj_index: dict = {}  # handle-key -> _Atom (chars will be filled below)
+    obj_order: List[int] = []  # keys of kept atoms, in page-object order
+    for oi in range(n_objects):
+        obj = pdfium_raw.FPDFPage_GetObject(page_handle, oi)
+        if pdfium_raw.FPDFPageObj_GetType(obj) != pdfium_raw.FPDF_PAGEOBJ_TEXT:
+            continue
+        font_obj = pdfium_raw.FPDFTextObj_GetFont(obj)
+        fn = pdfium_raw.FPDFFont_GetBaseFontName(font_obj, font_buf, _FONT_BUF_SIZE)
+        raw_font = (
+            font_buf.raw[: max(0, fn - 1)].decode("utf-8", errors="replace") if fn > 0 else ""
+        )
+        if _is_non_latin_font(raw_font):
+            # Mark with a sentinel so chars routed here are dropped.
+            obj_index[_obj_key(obj)] = None
+            continue
+        pdfium_raw.FPDFPageObj_GetBounds(
+            obj,
+            ctypes.byref(left),
+            ctypes.byref(bottom),
+            ctypes.byref(right),
+            ctypes.byref(top),
+        )
+        key = _obj_key(obj)
+        obj_index[key] = _Atom(
+            x_left=left.value,
+            x_right=right.value,
+            y_top=top.value,
+            y_bot=bottom.value,
+            font=_strip_font_subset_prefix(raw_font),
+        )
+        obj_order.append(key)
+
+    # 2. Walk per-glyph chars. For each char, ask PDFium which text
+    #    object owns it and append the char to that atom's list.
+    n_chars = tp.count_chars()
+    ox = ctypes.c_double()
+    oy = ctypes.c_double()
+    for ci in range(n_chars):
+        ch = tp.get_text_range(ci, 1)
+        if ch in ("\r", "\n", "�"):
+            continue
+        x0, y0_bbox, x1, y1_bbox = tp.get_charbox(ci)
+        if y1_bbox - y0_bbox <= 0 or x1 - x0 <= 0:  # skip zero-area glyph boxes
+            continue
+        text_obj = pdfium_raw.FPDFText_GetTextObject(tp_handle, ci)
+        atom = obj_index.get(_obj_key(text_obj))
+        if atom is None:  # None == not text, or non-Latin (dropped)
+            continue
+        pdfium_raw.FPDFText_GetCharOrigin(tp_handle, ci, ox, oy)
+        atom.chars.append(
+            Char(
+                text=ch,
+                x0=x0,
+                y0=oy.value,  # baseline from the char origin, not the bbox bottom
+                x1=x1,
+                y1=y1_bbox,  # top of the glyph box
+                font=atom.font,
+            )
+        )
+
+    # 3. Return atoms in page-object order, dropping empties.
+    return [a for k in obj_order if (a := obj_index.get(k)) is not None and a.chars]
+
+
+def _obj_key(obj_ptr) -> int:
+    """Map a PDFium object pointer to a hashable integer key.
+
+    Falsy (null) pointers give 0. Objects exposing ``.value`` use that
+    integer; other pointers use the address of the object they point at.
+    """
+    if not obj_ptr:
+        return 0
+    try:
+        return obj_ptr.value or 0
+    except AttributeError:
+        return ctypes.addressof(obj_ptr.contents)
+
+
+# ---------------------------------------------------------------------- overlay dedup
+
+
+def _dedupe_overlay_atoms(atoms: List[_Atom]) -> List[_Atom]:
+    """Drop atoms that are overlay duplicates of another atom on the
+    same visual row. Survivors keep their input order.
+
+    Detection: atoms are first bucketed into row bands no taller than
+    ``Y_OVERLAY_ROW_TOL``. Within a band, two atoms are an overlay pair
+    if they share a (non-empty) font, their x-ranges overlap by at least
+    ``X_OVERLAY_MIN_FRAC`` of the narrower atom's width, and their
+    ``y_top`` values differ by ``Y_OVERLAY_MIN_OFFSET`` or more. (A
+    smaller offset means they're legitimate side-by-side cells.)
+
+    Resolution: keep the atom whose ``y_top`` is closer to the band's
+    median ``y_top`` (ties keep the upper atom). Once an atom has been
+    dropped it stops taking part, so it cannot evict further atoms.
+    """
+    if len(atoms) < 2:
+        return atoms
+    # Bucket atoms into approximate rows.
+    sorted_atoms = sorted(enumerate(atoms), key=lambda p: -p[1].y_top)
+    rows: List[List[tuple]] = []
+    anchor: Optional[float] = None
+    for idx, a in sorted_atoms:
+        if anchor is None or abs(a.y_top - anchor) > Y_OVERLAY_ROW_TOL:
+            rows.append([(idx, a)])
+            anchor = a.y_top
+        else:
+            rows[-1].append((idx, a))
+
+    drop: set = set()
+    for row in rows:
+        if len(row) < 2:
+            continue
+        median_y = sorted(a.y_top for _, a in row)[len(row) // 2]
+        for ii in range(len(row)):
+            oi, ai = row[ii]
+            if oi in drop:
+                continue
+            for jj in range(ii + 1, len(row)):
+                oj, aj = row[jj]
+                if oj in drop or not ai.font or ai.font != aj.font:
+                    continue
+                # x-overlap as fraction of the narrower atom's width.
+                xo = min(ai.x_right, aj.x_right) - max(ai.x_left, aj.x_left)
+                narrower = min(ai.width, aj.width)
+                if xo <= 0 or narrower <= 0 or xo / narrower < X_OVERLAY_MIN_FRAC:
+                    continue
+                # Same-row check: y-offset must be in the "overlay" band.
+                if abs(ai.y_top - aj.y_top) < Y_OVERLAY_MIN_OFFSET:
+                    continue
+                # Found a duplicate pair — drop the one further from median.
+                if abs(ai.y_top - median_y) > abs(aj.y_top - median_y):
+                    drop.add(oi)
+                    break  # `ai` is gone; it must not go on to evict other atoms
+                drop.add(oj)
+
+    return [a for i, a in enumerate(atoms) if i not in drop]
+
+
+# ---------------------------------------------------------------------- line clustering
+
+
+def _cluster_into_lines(atoms: List[_Atom], page_num: int) -> List[Line]:
+    """Group every surviving char into `Line`s, ordered top-down by baseline.
+
+    Chars are visited in descending ``y0``: one within `Y_TOL` of the
+    current line's baseline joins it and the baseline becomes the running
+    mean of the members' ``y0``; any other char opens a new line. The
+    drifting baseline is what merges CAMS scheme + registrar wraps.
+    """
+    ordered = sorted((ch for atom in atoms for ch in atom.chars), key=lambda ch: -ch.y0)
+    result: List[Line] = []
+    current: Optional[Line] = None
+    for ch in ordered:
+        if current is None or not abs(ch.y0 - current.baseline) <= Y_TOL:
+            current = Line(page=page_num, baseline=ch.y0, chars=[ch])
+            result.append(current)
+            continue
+        current.chars.append(ch)
+        count = len(current.chars)
+        current.baseline = (current.baseline * (count - 1) + ch.y0) / count
+    return result
diff --git a/casparser/parsers/mupdf.py b/casparser/parsers/mupdf.py
deleted file mode 100644
index f1ce379..0000000
--- a/casparser/parsers/mupdf.py
+++ /dev/null
@@ -1,330 +0,0 @@
-import copy
-import io
-import re
-from operator import itemgetter
-from typing import Any, Iterator, List, Union
-
-# noinspection PyPackageRequirements
-import fitz
-
-from casparser.enums import FileType
-from casparser.exceptions import CASParseError, IncorrectPasswordError
-from casparser.types import InvestorInfo, PartialCASData
-
-from .utils import is_close
-
-
-def merge_bbox(bbox1, bbox2):
-    """Merge two pdf blocks' bounding boxes."""
-    return (
-        min(bbox1[0], bbox2[0]),  # x0
-        min(bbox1[1], bbox2[1]),  # y0
-        max(bbox1[2], bbox2[2]),  # x1
-        max(bbox1[3], bbox2[3]),  # y1
-    )
-
-
-def group_similar_blocks(blocks, file_type=FileType.UNKNOWN, mode="vertical"):
-    """Group overlapping blocks in a page."""
-    grouped_blocks = []
-    curr_y0 = -1
-    curr_y1 = -1
-    blocks = copy.deepcopy(blocks)
-
-    if mode == "vertical":
-        blocks = sorted(blocks, key=lambda x: (x["bbox"][0], x["bbox"][1]))
-    else:
-        blocks = sorted(blocks, key=lambda x: (x["bbox"][1], x["bbox"][0]))
-
-    for block in blocks:
-        x0, y0, x1, y1 = block["bbox"]
-        if abs(y1 - y0) > abs(x1 - x0) * 4:
-            # Ignore vertical elements. No useful info there.
-            continue
-        if (is_close(y0, curr_y0, 0.1) or curr_y0 <= y0 <= y1 <= curr_y1) and len(
-            grouped_blocks
-        ) > 0:
-            new_block = grouped_blocks.pop()
-            new_block["lines"].extend(block["lines"])
-            new_block["bbox"] = merge_bbox(new_block["bbox"], block["bbox"])
-        else:
-            new_block = block
-        grouped_blocks.append(new_block)
-        curr_y0 = new_block["bbox"][1]
-        curr_y1 = new_block["bbox"][3]
-
-    if mode == "vertical":
-        grouped_blocks = group_similar_blocks(
-            grouped_blocks, file_type=file_type, mode="horizontal"
-        )
-
-    return grouped_blocks
-
-
-def extract_blocks(page_dict, file_type=FileType.UNKNOWN):
-    """Extract text blocks from page dictionary.
-    The logic is similar to `PyMuPDF.TextPage.extractBLOCKS` but with a slightly better text
-    arrangement.
-    """
-    tolerance = {FileType.CAMS: 3, FileType.KFINTECH: 3, FileType.CDSL: 8, FileType.NSDL: 8}.get(
-        file_type, 3
-    )
-
-    # For NSDL/CDSL statements, holdings rows span multiple visual rows that
-    # represent a single logical entity; keep the legacy behaviour of joining
-    # them with ``\n`` so the downstream regexes (which use ``re.DOTALL``) can
-    # match across the rows.
-    split_rows = file_type not in (FileType.NSDL, FileType.CDSL)
-
-    blocks = []
-    grouped_blocks = group_similar_blocks(page_dict.get("blocks", []), file_type=file_type)
-
-    for num, block in enumerate(grouped_blocks):
-        rendered_rows = []
-        items = []
-        block["lines"] = sorted(block["lines"], key=lambda x: (x["bbox"][1], x["bbox"][0]))
-        y0 = block["lines"][0]["bbox"][1] if block.get("lines") else 0
-        y1 = block["lines"][0]["bbox"][3] if block.get("lines") else 0
-
-        def emit_row():
-            if not items:
-                return
-            full_text = "\t\t".join(
-                [x[0].strip() for x in sorted(items, key=lambda x: x[1][0]) if x[0].strip()]
-            )
-            if not full_text.strip():
-                return
-            if split_rows:
-                row_x0 = min(x[1][0] for x in items)
-                row_y0 = min(x[1][1] for x in items)
-                row_x1 = max(x[1][2] for x in items)
-                row_y1 = max(x[1][3] for x in items)
-                blocks.append([row_x0, row_y0, row_x1, row_y1, full_text])
-            else:
-                rendered_rows.append(full_text)
-
-        for line in block["lines"]:
-            if len(items) > 0 and not (
-                is_close(y0, line["bbox"][1], tol=tolerance)
-                or is_close(y1, line["bbox"][3], tol=tolerance)
-                or y0 <= line["bbox"][1] <= line["bbox"][3] <= y1
-            ):
-                emit_row()
-                items = []
-                y0, y1 = line["bbox"][1], line["bbox"][3]
-            else:
-                # Expand the band so subsequent lines that overlap with any
-                # previously-grouped item still get attached to the row.
-                y0 = min(y0, line["bbox"][1])
-                y1 = max(y1, line["bbox"][3])
-            line_text = "\t\t".join(
-                [
-                    span["text"].strip()
-                    for span in sorted(line["spans"], key=lambda x: (x["origin"][0]))
-                    if span["text"].strip()
-                ]
-            )
-            items.append([line_text, line["bbox"]])
-        emit_row()
-
-        if not split_rows and rendered_rows:
-            blocks.append([*block["bbox"], "\n".join(rendered_rows)])
-    return blocks
-
-
-def parse_file_type(blocks):
-    """Parse file type."""
-    for block in sorted(blocks, key=lambda x: -x["bbox"][1]):
-        block_str = str(block)
-        if re.search("CAMSCASWS", block_str):
-            return FileType.CAMS
-        elif re.search("KFINCASWS", block_str):
-            return FileType.KFINTECH
-        elif "NSDL Consolidated Account Statement" in block_str or "About NSDL" in block_str:
-            return FileType.NSDL
-        elif "Central Depository Services (India) Limited" in block_str:
-            return FileType.CDSL
-    return FileType.UNKNOWN
-
-
-def parse_investor_info_dp(page_dict, page_rect: fitz.Rect) -> InvestorInfo:
-    """Parse investor info."""
-    width = max(page_rect.width, 600)
-    height = max(page_rect.height, 800)
-
-    blocks = sorted(
-        [x for x in page_dict["blocks"] if x["bbox"][1] < height / 2], key=lambda x: x["bbox"][1]
-    )
-
-    address_lines = []
-    email = ""
-    mobile = None
-    name = None
-    cas_id_found = False
-    for block in blocks:
-        for line in block["lines"]:
-            for span in filter(
-                lambda x: x["bbox"][0] <= width / 2 and x["text"].strip() != "", line["spans"]
-            ):
-                txt = span["text"].strip()
-                if not cas_id_found:
-                    if m := re.search(r"[CAS|NSDL]\s+ID\s*:\s*(.+?)(?:\s|$)", txt, re.I):
-                        # email = m.group(1).strip()
-                        cas_id_found = True
-                    continue
-                if name is None:
-                    name = txt
-                else:
-                    if (
-                        re.search(
-                            r"Statement\s+for\s+the\s+period|Your\s+demat\s+account\s+and\s+mutual\s+fund",
-                            txt,
-                            re.I | re.MULTILINE,
-                        )
-                        or mobile is not None
-                    ):
-                        return InvestorInfo(
-                            email=email,
-                            name=name,
-                            mobile=mobile or "",
-                            address="\n".join(address_lines),
-                        )
-                    elif m := re.search(r"mobile\s*:\s*([+\d]+)(?:s|$)", txt, re.I):
-                        mobile = m.group(1).strip()
-                    address_lines.append(txt)
-    raise CASParseError("Unable to parse investor data")
-
-
-def parse_investor_info(page_dict, page_rect: fitz.Rect) -> InvestorInfo:
-    """Parse investor info."""
-    width = max(page_rect.width, 600)
-    height = max(page_rect.height, 800)
-
-    blocks = sorted(
-        [x for x in page_dict["blocks"] if x["bbox"][1] < height / 2], key=lambda x: x["bbox"][1]
-    )
-
-    email_found = False
-    address_lines = []
-    email = None
-    mobile = None
-    name = None
-    for block in blocks:
-        for line in block["lines"]:
-            for span in filter(
-                lambda x: x["bbox"][0] <= width / 3 and x["text"].strip() != "", line["spans"]
-            ):
-                txt = span["text"].strip()
-                if not email_found:
-                    if m := re.search(r"^\s*email\s+id\s*:\s*(.+?)(?:\s|$)", txt, re.I):
-                        email = m.group(1).strip()
-                        email_found = True
-                    continue
-                if name is None:
-                    name = txt
-                else:
-                    if (
-                        re.search(
-                            r"Mutual\s+Fund|Date\s+Transaction|Folio\s+No|^Date\s*$",
-                            txt,
-                            re.I | re.MULTILINE,
-                        )
-                        or mobile is not None
-                    ):
-                        return InvestorInfo(
-                            email=email,
-                            name=name,
-                            mobile=mobile or "",
-                            address="\n".join(address_lines),
-                        )
-                    elif m := re.search(r"mobile\s*:\s*([+\d]+)(?:s|$)", txt, re.I):
-                        mobile = m.group(1).strip()
-                    address_lines.append(txt)
-    raise CASParseError("Unable to parse investor data")
-
-
-def group_similar_rows(elements_list: List[Iterator[Any]]):
-    """
-    Group elements having similar rows, with a tolerance.
-
-    :param elements_list: List of elements from each page
-    """
-    lines = []
-    for elements in elements_list:
-        sorted_elements = list(sorted(elements, key=itemgetter(1, 0)))
-        y0, y1 = 0, 0
-        if len(sorted_elements) > 0:
-            y0, y1 = sorted_elements[0][1], sorted_elements[0][3]
-        items = []
-        for el in sorted_elements:
-            x2, y2, x3, y3 = el[:4]
-            if abs(y3 - y2) > abs(x3 - x2):
-                # Ignore vertical elements. No useful info there.
-                continue
-            if len(items) > 0 and not (
-                is_close(y3, y1, tol=2) or is_close(y2, y0, tol=2) or y0 <= y2 <= y3 <= y1
-            ):
-                line = "\t\t".join(
-                    [x[4].strip() for x in sorted(items, key=lambda x: x[0]) if x[4].strip()]
-                )
-                if line.strip():
-                    lines.append(line)
-                items = []
-                y0, y1 = el[1], el[3]
-            items.append(el)
-        if len(items) > 0:
-            line = "\t\t".join([x[4].strip() for x in sorted(items, key=lambda x: x[0])])
-            if line.strip():
-                lines.append(line)
-    return lines
-
-
-def cas_pdf_to_text(filename: Union[str, io.IOBase], password) -> PartialCASData:
-    """
-    Parse CAS pdf and returns line data.
-
-    :param filename: CAS pdf file (CAMS or Kfintech)
-    :param password: CAS pdf password
-    :return: partial cas data with FileType, InvestorInfo and lines of data
-    """
-    file_type: FileType = FileType.UNKNOWN
-
-    if isinstance(filename, str):
-        fp = open(filename, "rb")
-    elif hasattr(filename, "read") and hasattr(filename, "close"):  # file-like object
-        fp = filename
-    else:
-        raise CASParseError("Invalid input. filename should be a string or a file like object")
-
-    with fp:
-        try:
-            doc = fitz.Document(stream=fp.read(), filetype="pdf")
-        except Exception as e:
-            raise CASParseError("Unhandled error while opening file :: %s" % (str(e)))
-
-        if doc.needs_pass:
-            rc = doc.authenticate(password)
-            if not rc:
-                raise IncorrectPasswordError("Incorrect PDF password!")
-
-        pages = []
-        investor_info = None
-
-        for page_num, page in enumerate(doc):
-            text_page = page.get_textpage()
-            page_dict = text_page.extractDICT(sort=True)
-            if file_type == FileType.UNKNOWN:
-                file_type = parse_file_type(page_dict["blocks"])
-            blocks = extract_blocks(page_dict, file_type=file_type)
-            sorted_blocks = sorted(blocks, key=itemgetter(1, 0))
-            if investor_info is None:
-                if file_type in (FileType.CAMS, FileType.KFINTECH):
-                    investor_info = parse_investor_info(page_dict, page.rect)
-                elif file_type in (FileType.NSDL, FileType.CDSL) and page_num == 1:
-                    investor_info = parse_investor_info_dp(page_dict, page.rect)
-            if file_type == FileType.NSDL and page_num == 0:
-                # Ignore first page. no useful data
-                continue
-            pages.append(sorted_blocks)
-        lines = group_similar_rows(pages)
-        return PartialCASData(file_type=file_type, investor_info=investor_info, lines=lines)
diff --git a/casparser/parsers/nsdl.py b/casparser/parsers/nsdl.py
new file mode 100644
index 0000000..aa123b2
--- /dev/null
+++ b/casparser/parsers/nsdl.py
@@ -0,0 +1,879 @@
+"""Dedicated NSDL parser.
+
+Consumes structured `Block`/`Cell` data from `pageobj.extract_blocks`
+and produces an `NSDLCASData` directly — no detour through PROD's
+`process_nsdl_text` and its regex tokenisation.
+
+Source-of-truth strategy:
+
+  1. **Page 2 carries the canonical account roster** in a small summary
+     table — one row per demat / MF-folio account with type, broker,
+     DP ID, Client ID, ISIN/scheme count, and balance. We bootstrap
+     accounts from here. This avoids the "false header" pollution that
+     comes from scanning every page for the phrase "Demat Account"
+     (footers, footnotes, paragraph 6/10/etc. all mention it).
+
+  2. **Per-account section headers** match an account in the roster
+     by `(dp_id, client_id)` and become the cursor for subsequent
+     equity / MF / bond rows in that section.
+
+  3. **"Mutual Fund Folios (F)" detailed table** routes to the
+     MF-folio pseudo-account. Rows use x-position-anchored columns
+     so the misplaced lone-digit UCC NSDL occasionally renders in
+     the units column gets recognised as an anomaly and folded back
+     into `ucc`, not into the numeric fields.
+
+Decimals are parsed at the parser level, stripping Indian-format
+commas, so we don't depend on the `MutualFund.fix_float` validator
+(which has a bug where aliased fields with `Optional[Decimal]`
+annotation slip past comma-stripping).
+"""
+
+from __future__ import annotations
+
+import re
+from dataclasses import dataclass
+from decimal import Decimal, InvalidOperation
+from typing import Dict, List, Optional, Tuple
+
+from casparser.enums import FileType
+from casparser.types import (
+    Bond,
+    DematAccount,
+    DematOwner,
+    Equity,
+    MutualFund,
+    NSDLCASData,
+    StatementPeriod,
+)
+
+from . import pageobj
+from ._investor import extract_nsdl_cdsl_investor
+from .pageobj import Block, Cell
+
+# --- patterns ---
+
+ISIN_RE = re.compile(r"^[A-Z]{2}[0-9A-Z]{9}\d$")
+INF_ISIN_RE = re.compile(r"^INF[0-9A-Z]{8}\d$")
+INE_ISIN_RE = re.compile(r"^IN[E9][0-9A-Z]{8}\d$")
+NUMERIC_RE = re.compile(r"^-?[\d,]+(?:\.\d+)?$")
+
+PERIOD_RE = re.compile(
+    r"(?:for\s+the\s+period\s+from|statement\s+for\s+the\s+period\s+from)\s+"
+    r"(\d{2}-[A-Za-z]{3}-\d{4})\s+to\s+(\d{2}-[A-Za-z]{3}-\d{4})",
+    re.I,
+)
+
+DEMAT_TYPE_RE = re.compile(r"^(NSDL|CDSL)\s+Demat\s+Account\s*$", re.I)
+DP_CLIENT_RE = re.compile(
+    r"DP\s*ID\s*:?\s*(\S+?)\s+Client\s*ID\s*:?\s*(\d+)",
+    re.I,
+)
+PAN_RE = re.compile(r"(.+?)\s*\(PAN\s*:\s*([^)]+)\)", re.I)
+MF_FOLIOS_HEADER_RE = re.compile(r"^Mutual\s+Fund\s+Folios\b", re.I)
+
+
+# --- decimal helpers ---
+
+
+def _to_decimal(text) -> Decimal:
+    if text is None:
+        return Decimal(0)
+    s = str(text).replace(",", "").strip()  # drop grouping commas before parsing
+    if not s or s in ("-", "--", "N.A", "NA"):  # blank / placeholder text counts as zero
+        return Decimal(0)
+    try:
+        return Decimal(s)
+    except InvalidOperation:
+        return Decimal(0)  # unparseable text also degrades to zero, never raises
+
+
+def _opt_decimal(text) -> Optional[Decimal]:
+    if text is None:
+        return None
+    s = str(text).replace(",", "").strip()  # drop grouping commas before parsing
+    if not s or s in ("-", "--", "N.A", "NA"):  # blank / placeholder text means "no value"
+        return None
+    try:
+        return Decimal(s)
+    except InvalidOperation:
+        return None  # unparseable text yields None (where _to_decimal yields 0)
+
+
+def _looks_numeric(text: str) -> bool:
+    s = text.strip()
+    if not s:
+        return False
+    return bool(NUMERIC_RE.match(s))
+
+
+# --- column anchors (x_left ranges) for the detailed MF Holdings table ---
+
+
+@dataclass(frozen=True)
+class _MFHoldingsCols:
+    # x_left bands for the 10 columns of the detailed MF Holdings
+    # table. Each band must not overlap its neighbour AND must cover
+    # the full range a cell's `x_left` can drift across — PDFium
+    # rounds glyph positions slightly differently across fixtures, so
+    # bands are deliberately wider than the visual column width
+    # (gap-to-gap rather than glyph-to-glyph). The "units" band reaches
+    # ~260 because the units glyph in some NSDL CAS variants starts at
+    # x≈225 and right-aligns; without the wider window the units cell
+    # falls into the inter-column gap and reads as 0.
+    cols = (
+        ("isin_ucc", 15, 75),
+        ("name", 75, 150),
+        ("folio", 150, 200),
+        ("units", 200, 260),
+        ("avg_cost", 260, 310),
+        ("total_cost", 310, 375),
+        ("current_nav", 375, 425),
+        ("current_value", 425, 480),
+        ("pnl", 480, 555),
+        ("returns", 555, 600),
+    )
+
+    def assign(self, cell: Cell) -> Optional[str]:
+        for key, lo, hi in self.cols:
+            if lo <= cell.x_left < hi:
+                return key
+        return None
+
+
+_MF_HOLDINGS = _MFHoldingsCols()
+
+
+# --- column anchors for the summary Corporate-Bonds table ---
+#
+# The NSDL-flavour bonds table on a demat-account page renders 8 data
+# cells per row. Two of them ('frequency' text + 'coupon rate' numeric)
+# share an x-band so they can't be distinguished by x alone — see
+# `_parse_bond_summary_row` for how the text/numeric discriminator is
+# applied within that band.
+@dataclass(frozen=True)
+class _BondSummaryCols:
+    cols = (
+        ("isin", 15, 80),
+        ("name", 80, 175),
+        ("coupon_band", 175, 240),  # frequency (text) + coupon (numeric)
+        ("maturity", 240, 310),
+        ("num_bonds", 310, 390),
+        ("face_value", 390, 510),
+        ("value", 510, 600),
+    )
+
+    def assign(self, cell: Cell) -> Optional[str]:
+        for key, lo, hi in self.cols:
+            if lo <= cell.x_left < hi:
+                return key
+        return None
+
+
+_BOND_SUMMARY = _BondSummaryCols()
+
+
+# --- account key utilities ---
+
+
+def _full_type(type_word: str) -> str:
+    """`NSDL`/`CDSL` -> `NSDL Demat Account`/`CDSL Demat Account` to
+    match the convention used elsewhere in the codebase."""
+    return f"{type_word.upper()} Demat Account"
+
+
+def _account_key(type_word: str, dp_id: str, client_id: str) -> Tuple[str, str, str]:
+    return (type_word.upper(), dp_id.strip(), client_id.strip())
+
+
+# --- parser entry point ---
+
+
+def parse_nsdl(
+    pdf_path: str,
+    password: str,
+    file_type: FileType = FileType.NSDL,
+    *,
+    _doc=None,
+) -> NSDLCASData:
+    # Extract atoms once, then derive both the structured Blocks the
+    # holdings parser needs and the investor info from the same pages.
+    atoms = pageobj.extract_atoms(pdf_path, password, _doc=_doc)
+    blocks = pageobj.blocks_from_atoms(atoms)
+    period = _find_period(blocks) or StatementPeriod(**{"from": "", "to": ""})
+
+    # Phase 1: bootstrap accounts from page-2 summary table.
+    accounts_by_key: Dict[Tuple[str, str, str], DematAccount] = {}
+    ordered_accounts: List[DematAccount] = []
+    mf_folios_account: Optional[DematAccount] = None
+
+    pending_owners: List[DematOwner] = []  # owners harvested from
+    # the most recent 'in the (single|joint) name of' header; consumed
+    # by the next summary-demat row and reset on each new header.
+
+    for b in blocks:
+        if b.page != 2:
+            continue
+        txt = b.text()
+        ltxt = txt.lower()
+        if (
+            "in the single name of" in ltxt
+            or "in the joint names of" in ltxt
+            or "in the joint name of" in ltxt
+        ):
+            pending_owners = []
+            continue
+        # Capture owner names that follow.
+        if PAN_RE.search(txt):
+            # `name1 (PAN:...)\nname2 (PAN:...)` is one cell with \n.
+            for m in PAN_RE.finditer(txt):
+                pending_owners.append(
+                    DematOwner(
+                        name=m.group(1).strip(),
+                        PAN=m.group(2).strip(),
+                    )
+                )
+            continue
+        # Summary demat-account row
+        if _is_summary_demat_row(b):
+            ac, key = _account_from_summary_row(b, list(pending_owners))
+            if key not in accounts_by_key:
+                accounts_by_key[key] = ac
+                ordered_accounts.append(ac)
+            continue
+        # Summary MF Folios row
+        if _is_summary_mf_folios_row(b):
+            if mf_folios_account is None:
+                mf_folios_account = _mf_folios_account_from_summary(b, list(pending_owners))
+                ordered_accounts.append(mf_folios_account)
+            continue
+
+    # Phase 2: walk all blocks; identify per-account section headers
+    # and parse subsequent holdings into the matching account.
+    #
+    # `cur_section` (equities / mfunds / bonds) is set by the small
+    # section-marker blocks ('Equity Shares', 'Mutual Funds (M)',
+    # 'Corporate Bonds (C)' etc.) and disambiguates the otherwise-
+    # identical 18-cell detailed-table header — without it, MF and
+    # bond rows on a CDSL detailed page get misrouted into equities.
+    # `cur_mode` is the final routing key (one of
+    # 'equities_summary', 'equities_detailed', 'mfunds_summary',
+    # 'mfunds_detailed', 'mf_holdings', 'bonds_summary',
+    # 'bonds_detailed') chosen by `_detect_mode_from_header` once the
+    # column-header row arrives.
+    page_blocks = [b for b in blocks if b.page > 2]
+    cur_account: Optional[DematAccount] = None
+    cur_mode: Optional[str] = None
+    cur_section: Optional[str] = None
+
+    i = 0
+    while i < len(page_blocks):
+        b = page_blocks[i]
+        txt = b.text()
+        ltxt = txt.lower()
+
+        # Per-account section header. Same-block form (single-name
+        # accounts) or split across 3 blocks (joint-name accounts).
+        ac_key, consumed = _try_per_account_header(page_blocks, i)
+        if ac_key is not None:
+            cur_account = accounts_by_key.get(ac_key)
+            cur_mode = None
+            cur_section = None
+            i += consumed
+            continue
+
+        # MF Folios detailed-table header
+        if "mutual fund folios (f)" in ltxt:
+            cur_account = mf_folios_account
+            cur_mode = "mf_holdings"
+            cur_section = "mfunds"
+            i += 1
+            continue
+
+        # Table-header rows tell us which kind of holdings table follows.
+        if cur_account is not None:
+            mode = _detect_mode_from_header(b, cur_section)
+            if mode is not None:
+                cur_mode = mode
+                i += 1
+                continue
+            if _is_total_row(b):
+                i += 1
+                continue
+            sec = _section_marker_kind(b)
+            if sec is not None:
+                cur_section = sec
+                # Clear cur_mode on every section marker (supported or
+                # not) so the rows that follow are not routed into the
+                # previous table's list. cur_mode is set again once the
+                # next column-header row is detected.
+                cur_mode = None
+                i += 1
+                continue
+
+        # Holdings rows
+        if cur_account is None or cur_mode is None:
+            i += 1
+            continue
+        if cur_mode == "equities_summary":
+            eq = _parse_equity_row(b, detailed=False)
+            if eq:
+                cur_account.equities.append(eq)
+        elif cur_mode == "equities_detailed":
+            eq = _parse_equity_row(b, detailed=True)
+            if eq:
+                cur_account.equities.append(eq)
+        elif cur_mode == "mfunds_summary":
+            mf = _parse_summary_mf_row(b)
+            if mf:
+                cur_account.mutual_funds.append(mf)
+        elif cur_mode == "mfunds_detailed":
+            mf = _parse_detailed_mf_row(b)
+            if mf:
+                cur_account.mutual_funds.append(mf)
+        elif cur_mode == "mf_holdings":
+            mf = _parse_mf_holdings_row(b)
+            if mf:
+                cur_account.mutual_funds.append(mf)
+        elif cur_mode == "bonds_summary":
+            bd = _parse_bond_summary_row(b)
+            if bd:
+                cur_account.bonds.append(bd)
+        elif cur_mode == "bonds_detailed":
+            bd = _parse_bond_detailed_row(b)
+            if bd:
+                cur_account.bonds.append(bd)
+        i += 1
+
+    return NSDLCASData(
+        statement_period=period,
+        accounts=ordered_accounts,
+        investor_info=extract_nsdl_cdsl_investor(
+            pdf_path,
+            password,
+            _atoms=atoms,
+        ),
+        file_type=file_type,
+    )
+
+
+# --- summary-row recognisers (page 2) ---
+
+
+def _is_summary_demat_row(block: Block) -> bool:
+    """Page-2 summary row. Two physical layouts produce the same logical
+    row depending on how PDFium clusters the broker name and DP/Client
+    line:
+
+      4-cell form: ``Type | "<BROKER>\\nDP ID:... Client ID:..." | folios | value``
+        Broker name and DP-ID line share one cell (joined with newline).
+
+      5-cell form: ``Type | "<BROKER>" | "DP ID:... Client ID:..." | folios | value``
+        Broker name and DP-ID line render as separate cells.
+
+    Both are accepted; we discriminate by locating the cell whose text
+    contains the DP/Client pattern.
+    """
+    if len(block.cells) not in (4, 5):
+        return False
+    if not DEMAT_TYPE_RE.match(block.cells[0].text.strip()):
+        return False
+    return any(DP_CLIENT_RE.search(c.text) for c in block.cells[1:])
+
+
+def _is_summary_mf_folios_row(block: Block) -> bool:
+    if len(block.cells) != 4:
+        return False
+    if not MF_FOLIOS_HEADER_RE.match(block.cells[0].text.strip()):
+        return False
+    return True
+
+
+def _account_from_summary_row(
+    block: Block, owners: List[DematOwner]
+) -> Tuple[DematAccount, Tuple[str, str, str]]:
+    """Build a DematAccount from a page-2 summary row, handling both the
+    4-cell and 5-cell layouts (see :func:`_is_summary_demat_row`)."""
+    type_word = DEMAT_TYPE_RE.match(block.cells[0].text.strip()).group(1).upper()
+    # Locate the cell carrying the DP/Client identifiers; everything
+    # before it (cell index 1, possibly inline in the same cell) is the
+    # broker name.
+    dp_cell_idx = next(
+        (i for i in range(1, len(block.cells)) if DP_CLIENT_RE.search(block.cells[i].text)),
+        1,
+    )
+    dp_cell_text = block.cells[dp_cell_idx].text
+    dpc = DP_CLIENT_RE.search(dp_cell_text)
+    dp_id = dpc.group(1) if dpc else ""
+    client_id = dpc.group(2) if dpc else ""
+    # Broker = the dp-cell text minus the DP/Client suffix, falling
+    # back to the cell immediately before it for the 5-cell layout.
+    broker_lines = [
+        ln.strip() for ln in dp_cell_text.split("\n") if ln.strip() and not DP_CLIENT_RE.search(ln)
+    ]
+    if broker_lines:
+        broker = broker_lines[0]
+    elif dp_cell_idx >= 2:
+        broker = block.cells[dp_cell_idx - 1].text.strip()
+    else:
+        broker = ""
+    # Numerics (folios, balance) are the last two cells.
+    folios = int(_to_decimal(block.cells[-2].text))
+    balance = _to_decimal(block.cells[-1].text)
+    ac = DematAccount(
+        name=broker,
+        type=_full_type(type_word),
+        dp_id=dp_id,
+        client_id=client_id,
+        folios=folios,
+        balance=balance,
+        owners=list(owners),
+        equities=[],
+        mutual_funds=[],
+        bonds=[],
+    )
+    return ac, _account_key(type_word, dp_id, client_id)
+
+
+def _mf_folios_account_from_summary(block: Block, owners: List[DematOwner]) -> DematAccount:
+    # cells: ['Mutual Fund Folios', '25 Folios', '44', '5,37,10,359.39']
+    folios_m = re.search(r"(\d+)", block.cells[1].text)
+    folios = int(folios_m.group(1)) if folios_m else 0
+    balance = _to_decimal(block.cells[3].text)
+    return DematAccount(
+        name="Mutual Fund Folios",
+        type="Mutual Fund Folios",
+        dp_id="",
+        client_id="",
+        folios=folios,
+        balance=balance,
+        owners=list(owners),
+        equities=[],
+        mutual_funds=[],
+        bonds=[],
+    )
+
+
+# --- per-account section headers ---
+
+
+def _try_per_account_header(
+    blocks: List[Block], i: int
+) -> Tuple[Optional[Tuple[str, str, str]], int]:
+    """A per-account header marks the start of a holdings section for
+    a specific account. Returns `(account_key, blocks_consumed)`.
+
+    Two header layouts:
+      A) **Single-block (single-name account)** — one block has TYPE
+         + DP/Client in one row of 5 cells, plus broker name +
+         'ACCOUNT HOLDER' + PAN.
+      B) **Split (joint-name account)** — the header spans three
+         consecutive blocks: `<TYPE> Demat Account | ACCOUNT HOLDERS`,
+         `<BROKER> | <NAME1> (PAN:…)`, `DP ID:… Client ID:… | <NAME2>
+         (PAN:…)`. We scan ahead up to 3 blocks to gather the DP/Client.
+
+    Footnotes / paragraph text that happens to mention 'demat account'
+    are rejected because they have too many cells / too little
+    structure.
+    """
+    b = blocks[i]
+    txt = b.text()
+    type_m = re.search(r"\b(NSDL|CDSL)\b\s+Demat\s+Account", txt, re.I)
+    if not type_m:
+        return None, 1
+
+    # Case A: DP/Client in the same block
+    dpc = DP_CLIENT_RE.search(txt)
+    if dpc and 3 <= len(b.cells) <= 8 and len(txt) < 500:
+        return _account_key(type_m.group(1), dpc.group(1), dpc.group(2)), 1
+
+    # Case B: look ahead for DP/Client (joint-account header form)
+    if "account holders" in txt.lower() or "account holder" in txt.lower():
+        for j in range(1, 4):
+            if i + j >= len(blocks):
+                break
+            nxt = blocks[i + j]
+            if nxt.page != b.page:
+                break
+            dpc = DP_CLIENT_RE.search(nxt.text())
+            if dpc:
+                return _account_key(type_m.group(1), dpc.group(1), dpc.group(2)), j + 1
+
+    return None, 1
+
+
+def _detect_mode_from_header(
+    block: Block,
+    cur_section: Optional[str] = None,
+) -> Optional[str]:
+    """Return the holdings-mode this column-header row implies, or
+    None if it isn't a header row or `cur_section` is 'unsupported'.
+
+    `cur_section` (set by the most recent section-marker block) is used
+    to disambiguate the 18-cell detailed table header — its column set
+    is identical for equities, mutual funds and bonds, and only the
+    preceding section marker tells us which.
+    """
+    if cur_section == "unsupported":
+        return None  # never arm a mode: these rows belong to no list
+    if re.search(r"\b(IN[EF9][0-9A-Z]{8}\d)\b", block.text(), re.I):
+        return None  # has an ISIN → it's a data row
+    txt = block.text().lower().replace("\n", " ").replace("\t\t", " ")
+    # MF Holdings (F) — test first; it also carries "ISIN Description".
+    if "folio no" in txt and ("average" in txt or "total cost" in txt):
+        return "mf_holdings"
+    # Detailed table — same columns for every kind; section decides.
+    if "current bal" in txt and ("market price" in txt or "value in" in txt):
+        if cur_section == "bonds":
+            return "bonds_detailed"
+        if cur_section == "mfunds":
+            return "mfunds_detailed"
+        return "equities_detailed"
+    # Summary bonds table on a demat-account page.
+    if "coupon" in txt and ("maturity" in txt or "frequency" in txt):
+        return "bonds_summary"
+    # Summary equity table.
+    if "stock symbol" in txt and "company name" in txt:
+        return "equities_summary"
+    # Summary MF table on per-account page.
+    if "isin description" in txt and ("nav" in txt or "value in" in txt):
+        return "mfunds_summary"
+    return None
+
+
+# Section markers are short blocks (1-2 cells) whose text labels which
+# kind of holdings the following table contains.  Mapping is from the
+# lowercased marker text to a section name used to disambiguate detailed
+# table headers.  Sections not in the map ('preference shares (p)',
+# 'alternate investment fund (a)', etc.) are still recognised as
+# markers — they clear the active mode so subsequent rows are ignored
+# — but route their rows to no holdings list.
+_SECTION_MARKER_MAP = {
+    "equity shares": "equities",
+    "equities (e)": "equities",
+    "mutual funds (m)": "mfunds",
+    "mutual funds units held with the amc": "mfunds",
+    "corporate bonds (c)": "bonds",
+}
+
+# Markers we recognise as 'a new section starts here' but whose rows
+# we don't parse — keeps cur_mode cleared so unrelated subsequent rows
+# don't get misrouted into the previous section's list.
+_UNSUPPORTED_SECTION_MARKERS = frozenset(
+    {
+        "preference shares (p)",
+        "alternate investment fund (a)",
+        "money market instruments (i)",
+        "securitised instruments (s)",
+        "government securities (g)",
+        "postal saving scheme (o)",
+        "national pension system (n)",
+        "zero coupon zero principal(z)",
+    }
+)
+
+
+def _section_marker_kind(block: Block) -> Optional[str]:
+    """Return the section label ('equities' / 'mfunds' / 'bonds' /
+    'unsupported') if `block` is a section marker, else None."""
+    if len(block.cells) > 2:
+        return None
+    txt = block.text().strip().lower()
+    if txt in _SECTION_MARKER_MAP:
+        return _SECTION_MARKER_MAP[txt]
+    if txt in _UNSUPPORTED_SECTION_MARKERS:
+        return "unsupported"
+    return None
+
+
+# --- generic recognisers ---
+
+
+def _find_period(blocks: List[Block]) -> Optional[StatementPeriod]:
+    for b in blocks:
+        m = PERIOD_RE.search(b.text())
+        if m:
+            return StatementPeriod(**{"from": m.group(1), "to": m.group(2)})
+    return None
+
+
+def _is_table_header(block: Block) -> bool:
+    """Column-label row (no ISIN, multiple recognisable header words)."""
+    txt = block.text().lower().replace("\t\t", " ").replace("\n", " ")
+    if re.search(r"\b(IN[EF9][0-9A-Z]{8}\d)\b", txt, re.I):
+        return False
+    keywords = (
+        "isin description",
+        "no. of units",  # txt has "\n" folded to " ", so match that form
+        "no. of shares",
+        "stock symbol",
+        "current bal",
+        "free bal",
+        "market price",
+        "value in",
+        "total cost",
+        "current nav",
+        "unrealised",
+        "annualised",
+        "isin description folio",
+        "isin description no.",
+    )
+    return sum(1 for k in keywords if k in txt) >= 2
+
+
+def _is_total_row(block: Block) -> bool:
+    first = block.cells[0].text.strip().lower() if block.cells else ""
+    return first in ("sub total", "total", "grand total")
+
+
+# --- equity row ---
+
+
+def _parse_equity_row(block: Block, detailed: bool = False) -> Optional[Equity]:
+    """Equity row. Cell 0 carries the ISIN (sometimes with ticker on a
+    second line). Trailing cells are numerics.
+
+    - **Summary form** (NSDL-account 'Equity Shares' table): 4
+      numerics — face_value, num_shares, price, value. We take the
+      last three.
+    - **Detailed form** (CDSL-account / extended-NSDL table): 11
+      numerics — current_bal (=num_shares), free, lent, pledge_setup,
+      locked_in, safekeep, earmarked, pledged, pledgee, market_price,
+      value. We take numerics[0] for num_shares and the last two for
+      price / value.
+    """
+    if not block.cells:
+        return None
+    first = block.cells[0].text
+    first_token = first.split("\n", 1)[0].strip()
+    if not ISIN_RE.match(first_token):
+        return None
+    isin = first_token
+
+    name_cell = block.cells[1].text.replace("\n", " ").strip() if len(block.cells) > 1 else None
+
+    numerics = [c.text.strip() for c in block.cells[2:] if _looks_numeric(c.text)]
+    if len(numerics) < 3:
+        return None
+    if detailed or len(numerics) >= 5:
+        num_shares = _to_decimal(numerics[0])
+    else:
+        num_shares = _to_decimal(numerics[-3])
+    price = _to_decimal(numerics[-2])
+    value = _to_decimal(numerics[-1])
+
+    return Equity(
+        name=name_cell,
+        isin=isin,
+        num_shares=num_shares,
+        price=price,
+        value=value,
+    )
+
+
+# --- summary MF row (per-account 'Mutual Funds (M)' table) ---
+
+
+def _parse_summary_mf_row(block: Block) -> Optional[MutualFund]:
+    if not block.cells:
+        return None
+    first = block.cells[0].text.strip()
+    if not ISIN_RE.match(first):
+        return None
+    isin = first
+    name = block.cells[1].text.replace("\n", " ").strip() if len(block.cells) > 1 else None
+    numerics = [c.text.strip() for c in block.cells[2:] if _looks_numeric(c.text)]
+    if len(numerics) < 3:
+        return None
+    balance = _to_decimal(numerics[0])
+    nav = _to_decimal(numerics[1])
+    value = _to_decimal(numerics[2])
+    return MutualFund(
+        name=name,
+        isin=isin,
+        balance=balance,
+        nav=nav,
+        value=value,
+    )
+
+
+# --- detailed MF Holdings row ---
+
+
+def _parse_mf_holdings_row(block: Block) -> Optional[MutualFund]:
+    """Detailed holdings row: ISIN, UCC, scheme name, folio, 7 numerics.
+    Cells map to columns by x-position. Out-of-band cells (e.g., the
+    lone UCC `8` PDFium renders at the units column's x position) are
+    flagged as anomalies and folded into the UCC field if missing."""
+    if not block.cells:
+        return None
+    by_col: Dict[str, Cell] = {}
+    anomalies: List[Cell] = []
+    for cell in block.cells:
+        key = _MF_HOLDINGS.assign(cell)
+        if key is None or key in by_col:
+            anomalies.append(cell)
+        else:
+            by_col[key] = cell
+
+    if "isin_ucc" not in by_col:
+        return None
+    isin_cell = by_col["isin_ucc"].text
+    lines = [ln.strip() for ln in isin_cell.split("\n") if ln.strip()]
+    if not lines or not INF_ISIN_RE.match(lines[0]):
+        return None
+    isin = lines[0]
+    ucc: Optional[str] = lines[1] if len(lines) > 1 else None
+
+    PLACEHOLDER_UCCS = {"NOT AVAILABLE", "NA", "N.A.", ""}
+    needs_ucc = ucc is None or ucc.upper() in PLACEHOLDER_UCCS
+    if anomalies and needs_ucc:
+        for a in anomalies:
+            t = a.text.strip()
+            if t and len(t) <= 32:
+                ucc = t
+                break
+
+    name = by_col["name"].text.replace("\n", " ").strip() if "name" in by_col else None
+    folio = by_col["folio"].text.strip() if "folio" in by_col else None
+
+    balance = _to_decimal(by_col.get("units").text if "units" in by_col else None)
+    avg_cost = _opt_decimal(by_col.get("avg_cost").text if "avg_cost" in by_col else None)
+    total_cost = _opt_decimal(by_col.get("total_cost").text if "total_cost" in by_col else None)
+    nav = _to_decimal(by_col.get("current_nav").text if "current_nav" in by_col else None)
+    value = _to_decimal(by_col.get("current_value").text if "current_value" in by_col else None)
+    pnl = _opt_decimal(by_col.get("pnl").text if "pnl" in by_col else None)
+    ret = _opt_decimal(by_col.get("returns").text if "returns" in by_col else None)
+
+    return MutualFund(
+        name=name,
+        isin=isin,
+        balance=balance,
+        nav=nav,
+        value=value,
+        avg_cost=avg_cost,
+        total_cost=total_cost,
+        ucc=ucc,
+        folio=folio,
+        pnl=pnl,
+        **{"return": ret},
+    )
+
+
+# --- detailed MF row (CDSL-style 'Mutual Funds (M)' table) ---
+
+
+def _parse_detailed_mf_row(block: Block) -> Optional[MutualFund]:
+    """Detailed 'Mutual Funds (M)' row on a CDSL demat-account page.
+
+    Same 18-column header / 13-cell data row as detailed equities;
+    ISINs start with `INF` rather than `INE`. We surface `num_shares`
+    as `balance` and the last two numerics as `nav` / `value`.
+    """
+    if not block.cells:
+        return None
+    first = block.cells[0].text.strip()
+    if not INF_ISIN_RE.match(first):
+        return None
+    isin = first
+    name = block.cells[1].text.replace("\n", " ").strip() if len(block.cells) > 1 else None
+    numerics = [c.text.strip() for c in block.cells[2:] if _looks_numeric(c.text)]
+    if len(numerics) < 3:
+        return None
+    balance = _to_decimal(numerics[0])
+    nav = _to_decimal(numerics[-2])
+    value = _to_decimal(numerics[-1])
+    return MutualFund(
+        name=name,
+        isin=isin,
+        balance=balance,
+        nav=nav,
+        value=value,
+    )
+
+
+# --- bond rows ---
+
+
+def _parse_bond_summary_row(block: Block) -> Optional[Bond]:
+    """NSDL-flavour summary bonds row (8 data cells).
+
+    Cells map to columns by x-position via `_BOND_SUMMARY`. Two cells
+    share the 'coupon_band' x range — the textual one is the coupon
+    frequency ("Once a year", "On Maturity") and the numeric one is the
+    coupon rate (e.g. 8.10). They're discriminated by ``_looks_numeric``.
+    """
+    if not block.cells:
+        return None
+    first = block.cells[0].text.split("\n", 1)[0].strip()
+    if not ISIN_RE.match(first):
+        return None
+    isin = first
+
+    by_col: Dict[str, List[Cell]] = {}
+    for cell in block.cells:
+        key = _BOND_SUMMARY.assign(cell)
+        if key is None:
+            continue
+        by_col.setdefault(key, []).append(cell)
+
+    name = None
+    if "name" in by_col:
+        name = " ".join(c.text.replace("\n", " ").strip() for c in by_col["name"]).strip() or None
+
+    coupon_rate: Optional[Decimal] = None
+    coupon_frequency: Optional[str] = None
+    for c in by_col.get("coupon_band", []):
+        if _looks_numeric(c.text):
+            coupon_rate = _opt_decimal(c.text)
+        else:
+            txt = c.text.replace("\n", " ").strip()
+            if txt:
+                coupon_frequency = txt
+
+    maturity_date: Optional[str] = None
+    if "maturity" in by_col:
+        maturity_date = by_col["maturity"][0].text.strip() or None
+
+    num_bonds = _to_decimal(by_col["num_bonds"][0].text) if "num_bonds" in by_col else Decimal(0)
+    face_value = _opt_decimal(by_col["face_value"][0].text) if "face_value" in by_col else None
+    value = _to_decimal(by_col["value"][0].text) if "value" in by_col else Decimal(0)
+
+    return Bond(
+        name=name,
+        isin=isin,
+        num_bonds=num_bonds,
+        value=value,
+        face_value=face_value,
+        coupon_rate=coupon_rate,
+        coupon_frequency=coupon_frequency,
+        maturity_date=maturity_date,
+    )
+
+
+def _parse_bond_detailed_row(block: Block) -> Optional[Bond]:
+    """CDSL-flavour detailed bonds row (13 data cells, same layout as
+    detailed equities). Yields only `num_bonds`, `market_price` and
+    `value` — the detailed table doesn't carry coupon / maturity /
+    face-value information.
+    """
+    if not block.cells:
+        return None
+    first = block.cells[0].text.strip()
+    if not ISIN_RE.match(first):
+        return None
+    isin = first
+    name = block.cells[1].text.replace("\n", " ").strip() if len(block.cells) > 1 else None
+    numerics = [c.text.strip() for c in block.cells[2:] if _looks_numeric(c.text)]
+    if len(numerics) < 3:
+        return None
+    num_bonds = _to_decimal(numerics[0])
+    market_price = _opt_decimal(numerics[-2])
+    value = _to_decimal(numerics[-1])
+    return Bond(
+        name=name,
+        isin=isin,
+        num_bonds=num_bonds,
+        value=value,
+        market_price=market_price,
+    )
diff --git a/casparser/parsers/pageobj.py b/casparser/parsers/pageobj.py
new file mode 100644
index 0000000..057de35
--- /dev/null
+++ b/casparser/parsers/pageobj.py
@@ -0,0 +1,435 @@
+"""Page-object based block extractor for NSDL/CDSL.
+
+PROD's PyMuPDF flow:
+  extractDICT(sort=True) → blocks → lines → spans
+  - one *span* ≈ one PDF text-show operation
+  - lines within a block joined by `\\n`, blocks joined by `\\u2029`
+  - PROD's `extract_blocks` further merges close-y lines into one
+    `\\t\\t`-joined "group line" within the block.
+
+pypdfium2's page-object API exposes the same granularity directly:
+`FPDFPage_GetObject` yields one object per text-show op, with bounds
+from `FPDFPageObj_GetBounds` and text from `FPDFTextObj_GetText`.
+
+This is strictly better than the content-stream-char walker in nsdl.py
+because each text-show op stays an atomic unit — no need to guess its
+boundary from x-jumps, so cells whose internal gap is smaller than
+inter-column gap (the NSDL/CDSL MF Holdings case) are no longer
+mis-merged.
+
+Layout reconstruction:
+1.  Extract one atom per text-show op (drop Mangal/Devanagari font).
+2.  Dedup atoms by `(x_left, y_top, text)` — CAS PDFs render the
+    top banner twice, both copies are present as separate objects.
+3.  Cluster atoms into *raw lines* by y_top within `Y_LINE_TOL`.
+4.  Cluster raw lines into *logical blocks* — consecutive raw lines
+    whose top-to-top y-gap is `≤ Y_BLOCK_TOL`. This is the analogue
+    of PyMuPDF's block grouping plus PROD's close-y line merging.
+5.  Within a block, group atoms into *columns* by left-edge alignment
+    (`X_LEFT_TOL`; see `_column_cluster` for why x-range overlap is not
+    used). Within a column, sort atoms top-down and join with `\\n`.
+    Sort columns left→right and join with `\\t\\t`.
+6.  Join blocks (within page) with `\\u2029`, pages with `\\u2029` too.
+
+The output is compatible with `text.split("\\u2029")` in
+`process_nsdl_text` / `process_cdsl_text`.
+"""
+
+from __future__ import annotations
+
+import ctypes
+from dataclasses import dataclass
+from typing import List, Optional, Tuple
+
+import pypdfium2 as pdfium
+import pypdfium2.raw as pdfium_raw
+
+from .extract import _is_non_latin_font
+
+# y_top tolerance for grouping atoms into one *raw line*. Text-show ops
+# on the same visual line share an identical baseline; 1.5pt absorbs
+# any sub-pixel jitter without merging neighbouring lines.
+Y_LINE_TOL = 1.5
+
+# Top-to-top y-gap threshold for keeping consecutive raw lines in the
+# same logical *block*. NSDL/CDSL tables use ~7pt line spacing within
+# a row (multi-line ISIN+UCC cells, multi-line scheme names) and ~11pt
+# between rows. 9pt cleanly separates them.
+Y_BLOCK_TOL = 9.0
+
+# Buffer sizes for ctypes
+_TEXT_BUF_SIZE = 2048  # bytes (UTF-16LE), so up to 1023 chars per atom
+_FONT_BUF_SIZE = 128
+
+
+@dataclass
+class Atom:
+    """One text-show operation on a page.
+
+    `stream_seq` is the position of this object in the content-stream
+    walk (counting both text and non-text objects). Two text atoms
+    that are *consecutive* in the stream — no PATH/IMAGE/etc. object
+    between them — have `stream_seq` differing by exactly 1, which is
+    how we tell PyMuPDF-style merge cases apart from same-row neighbours
+    that PyMuPDF would keep separate.
+    """
+
+    x_left: float  # left edge of the object's bounding box
+    x_right: float  # right edge of the bounding box
+    y_top: float  # top edge; larger values sort first in top-down ordering
+    y_bot: float  # bottom edge of the bounding box
+    text: str  # decoded text of the op, whitespace not stripped
+    font: str  # base font name read from the text object
+    stream_seq: int = 0  # 1-based tick from the object walk; 0 when not supplied
+
+
+def _read_text_obj(obj, tp_handle, buf, fname_buf) -> Tuple[str, str]:
+    """Decode a text object's content and font name. Returns ('', '') if the
+    text is blank or the font is non-Latin. Text too big for `buf` is re-read."""
+    cc = pdfium_raw.FPDFTextObj_GetText(obj, tp_handle, buf, _TEXT_BUF_SIZE)  # bytes, incl. NUL
+    if cc > _TEXT_BUF_SIZE:  # PDFium left `buf` untouched (stale text); retry with room
+        buf = (ctypes.c_ushort * ((cc + 1) // 2))()
+        cc = pdfium_raw.FPDFTextObj_GetText(obj, tp_handle, buf, cc)
+    text = bytes(buf)[: max(0, cc - 2)].decode("utf-16-le", errors="replace")
+    if not text.strip():
+        return "", ""
+    font = pdfium_raw.FPDFTextObj_GetFont(obj)
+    fn = pdfium_raw.FPDFFont_GetBaseFontName(font, fname_buf, _FONT_BUF_SIZE)
+    fname = fname_buf.raw[: max(0, fn - 1)].decode("utf-8", errors="replace") if fn > 0 else ""
+    return ("", "") if _is_non_latin_font(fname) else (text, fname)
+
+
+class _StreamCounter:
+    __slots__ = ("v",)  # single slot: the last value handed out
+
+    def __init__(self):
+        self.v = 0  # nothing counted yet
+
+    def tick(self):
+        nxt = self.v = self.v + 1  # advance, then report the new position
+        return nxt
+
+
+def _iter_text_objects(parent_obj_or_page, is_form: bool, counter: _StreamCounter):
+    """Walk the objects under a page (or a Form XObject), depth-first, and
+    yield `(text_object, stream_seq)` for every text object.
+
+    `parent_obj_or_page` is a raw page handle when `is_form` is False, a
+    raw form-object handle otherwise. `counter` ticks once per visited
+    object of any type, before that object is handled, so `stream_seq`
+    is the text object's position in the walk; consecutive values mean
+    nothing else was visited in between. A form is numbered before its
+    children. Bounds from `FPDFPageObj_GetBounds` are taken to be in
+    page coordinates at any nesting depth.
+    """
+    if is_form:
+        count_fn = pdfium_raw.FPDFFormObj_CountObjects
+        fetch_fn = pdfium_raw.FPDFFormObj_GetObject
+    else:
+        count_fn = pdfium_raw.FPDFPage_CountObjects
+        fetch_fn = pdfium_raw.FPDFPage_GetObject
+
+    for index in range(count_fn(parent_obj_or_page)):
+        child = fetch_fn(parent_obj_or_page, index)
+        kind = pdfium_raw.FPDFPageObj_GetType(child)
+        seq = counter.tick()
+        if kind == pdfium_raw.FPDF_PAGEOBJ_TEXT:
+            yield child, seq
+        elif kind == pdfium_raw.FPDF_PAGEOBJ_FORM:
+            yield from _iter_text_objects(child, is_form=True, counter=counter)
+
+
+def extract_atoms(
+    pdf_path: str,
+    password: str,
+    *,
+    _doc: "Optional[pdfium.PdfDocument]" = None,
+) -> List[List[Atom]]:
+    """Return one list of Atoms per page. Objects are visited in
+    object-index order, recursing into Form XObjects (CDSL CAS PDFs
+    nest their entire page inside a top-level FORM). A text object
+    whose bounds cannot be read is skipped instead of inheriting the
+    previous object's position.
+
+    `pdf_path` / `password` are only used to open the PDF when `_doc` is
+    not given; the dispatcher normally opens the document once and
+    threads it through detect / parser / investor extractor.
+    """
+    doc = _doc if _doc is not None else pdfium.PdfDocument(pdf_path, password=password)
+    pages: List[List[Atom]] = []
+    left, bottom, right, top = (ctypes.c_float() for _ in range(4))
+    byref = ctypes.byref
+    buf = (ctypes.c_ushort * (_TEXT_BUF_SIZE // 2))()
+    fname_buf = (ctypes.c_char * _FONT_BUF_SIZE)()
+    for page in doc:
+        page_handle = page.raw
+        tp = page.get_textpage()
+        tp_handle = tp.raw
+        atoms: List[Atom] = []
+        seen: set = set()  # dedup by (x_left, y_top, text)
+        counter = _StreamCounter()
+        for obj, seq in _iter_text_objects(page_handle, is_form=False, counter=counter):
+            text, fname = _read_text_obj(obj, tp_handle, buf, fname_buf)
+            if not text:
+                continue
+            ok = pdfium_raw.FPDFPageObj_GetBounds(
+                obj, byref(left), byref(bottom), byref(right), byref(top)
+            )
+            if not ok:
+                # The shared floats may still hold the previous object's
+                # box; an atom placed there would corrupt a cell.
+                continue
+            xl, xr, yt, yb = left.value, right.value, top.value, bottom.value
+            key = (round(xl, 1), round(yt, 1), text)
+            if key in seen:
+                continue
+            seen.add(key)
+            atoms.append(Atom(xl, xr, yt, yb, text, fname, stream_seq=seq))
+        pages.append(_dedupe_overlapping(atoms))
+    return pages
+
+
+def _dedupe_overlapping(atoms: List[Atom]) -> List[Atom]:
+    """Drop repeated renderings of the same text on the same line.
+
+    Intended for CDSL CAS PDFs, which reportedly render some text twice
+    (visible glyphs plus an accessibility text layer) as separate page
+    objects at slightly different x-positions but with identical text;
+    PyMuPDF is said to fold such copies into one span.
+
+    Atoms are bucketed by `y_top` rounded to 0.1. Within a bucket an
+    atom is discarded when an already-kept atom has the same stripped
+    text and a strictly overlapping x-range; the earliest copy wins.
+    The result is ordered bucket by bucket (buckets in order of first
+    appearance), with input order preserved inside each bucket.
+    """
+    rows: dict = {}
+    for atom in atoms:
+        rows.setdefault(round(atom.y_top, 1), []).append(atom)
+
+    survivors: List[Atom] = []
+    for row in rows.values():
+        unique: List[Atom] = []
+        for atom in row:
+            label = atom.text.strip()
+            clash = any(
+                kept.text.strip() == label
+                and atom.x_left < kept.x_right
+                and kept.x_left < atom.x_right
+                for kept in unique
+            )
+            if not clash:
+                unique.append(atom)
+        survivors += unique
+    return survivors
+
+
+def _cluster_raw_lines(atoms: List[Atom]) -> List[List[Atom]]:
+    """Split atoms into raw lines, scanning by descending y_top (ties by
+    x_left). An atom joins the current line while its y_top is within
+    `Y_LINE_TOL` of that line's *first* atom; the anchor is never moved,
+    so jitter cannot make a line drift.
+    """
+    lines: List[List[Atom]] = []
+    anchor_y: Optional[float] = None
+    for atom in sorted(atoms, key=lambda a: (-a.y_top, a.x_left)):
+        if anchor_y is not None and abs(atom.y_top - anchor_y) <= Y_LINE_TOL:
+            lines[-1].append(atom)
+        else:
+            lines.append([atom])
+            anchor_y = atom.y_top
+    return lines
+
+
+def _cluster_blocks(raw_lines: List[List[Atom]]) -> List[List[Atom]]:
+    """Chain raw lines into blocks: a line stays in the current block
+    when the drop from the previous line's first-atom y_top to its own
+    is ≤ Y_BLOCK_TOL. Each block is returned as one flat atom list."""
+    blocks: List[List[Atom]] = []
+    prev_top: Optional[float] = None
+    for line in raw_lines:
+        top = line[0].y_top
+        # The gap is measured line-to-line, not against the block's first line.
+        if prev_top is not None and prev_top - top <= Y_BLOCK_TOL:
+            blocks[-1].extend(line)
+        else:
+            blocks.append(list(line))
+        prev_top = top
+    return blocks
+
+
+# x_left tolerance for merging atoms into one vertical strip. Multi-line
+# table cells (CAS scheme names, ISIN+UCC stacks) all share an identical
+# x_left per text-show op; 3pt absorbs any sub-pixel jitter.
+X_LEFT_TOL = 3.0
+
+# Top-to-top y-gap allowed for vertical strip continuation. Within-cell
+# stacking is ~7pt in NSDL/CDSL tables; 9pt admits that without bridging
+# to the next row's atoms (which sit ~11pt below).
+STRIP_VERTICAL_GAP = 9.0
+
+
+# Two atoms in mid-table columns are merged into one vertical strip
+# only if their *left edges* match within `X_LEFT_TOL` AND their
+# *centres* drift apart by more than `CENTER_LEFT_ALIGN_TOL`. That
+# second condition tells left-aligned multi-line cells (right edges
+# wander with text width → centres drift) apart from centre-aligned
+# multi-row column headers (e.g., CDSL "Average Total" stacked over
+# "Expense Ratio" — both centred on the same column anchor → centres
+# nearly identical, should NOT collapse into one cell).
+#
+# Atoms at the leftmost column of the page are exempt from the
+# centre test: in CAS tables, column-1 stacking (ISIN+UCC, equity
+# ticker+name) is always a multi-line cell, never a centre-aligned
+# header. `LEFT_EDGE_X` is the cutoff x_left below which we trust the
+# x_left match alone.
+CENTER_LEFT_ALIGN_TOL = 1.0
+LEFT_EDGE_X = 100.0
+
+
+def _column_cluster(block_atoms: List[Atom]) -> List[List[Atom]]:
+    """Partition one block's atoms into vertical strips (multi-line
+    *cells*), scanning top-down and attaching each atom to the first
+    strip whose last atom it continues; otherwise it opens a new strip.
+
+    An atom continues a strip when, against the strip's last atom:
+      * the left edges agree within `X_LEFT_TOL`;
+      * it sits between 0.1pt above and `STRIP_VERTICAL_GAP` below; and
+      * either it starts left of `LEFT_EDGE_X`, or the two centres
+        differ by more than `CENTER_LEFT_ALIGN_TOL` (left-aligned text,
+        as opposed to a centre-aligned stacked header).
+
+    Left-edge matching is used instead of x-range overlap on purpose:
+    some CAS PDFs place an MF holding's UCC as a lone digit (`'8'`) at
+    the *units* column's x-position, and an overlap test would absorb
+    it into the units cell and break NSDL_MF_HOLDINGS_RE. Kept apart,
+    it becomes its own `\\t\\t` cell and ends up in the regex's `folio`
+    group — the same (admittedly imperfect) outcome as production.
+    """
+    strips: List[List[Atom]] = []
+    for atom in sorted(block_atoms, key=lambda x: (-x.y_top, x.x_left)):
+        atom_mid = (atom.x_left + atom.x_right) / 2
+        for strip in strips:
+            tail = strip[-1]
+            # Geometric gates first: same left edge, then directly below.
+            if not (abs(atom.x_left - tail.x_left) <= X_LEFT_TOL):
+                continue
+            if not (-0.1 <= tail.y_top - atom.y_top <= STRIP_VERTICAL_GAP):
+                continue
+            tail_mid = (tail.x_left + tail.x_right) / 2
+            # Left-edge column: the x_left match alone is trusted. Elsewhere
+            # the centres must drift, else it is a centre-aligned header.
+            if atom.x_left < LEFT_EDGE_X or abs(atom_mid - tail_mid) > CENTER_LEFT_ALIGN_TOL:
+                strip.append(atom)
+                break
+        else:
+            strips.append([atom])
+    return strips
+
+
+# --- Structured block API for dedicated NSDL/CDSL parsers ---
+
+
+@dataclass
+class Cell:
+    """A logical table cell — one column slice of a block. May span
+    multiple lines vertically (e.g., a multi-line scheme name)."""
+
+    x_left: float  # smallest x_left among the cell's atoms
+    x_right: float  # largest x_right among the cell's atoms
+    y_top: float  # largest y_top among the cell's atoms
+    y_bot: float  # smallest y_bot among the cell's atoms
+    text: str  # multi-line cells use `\\n` internally
+    atoms: List[Atom]  # the underlying text-show ops (top-down), for debugging
+
+
+@dataclass
+class Block:
+    """One logical row; `cells` are expected in left→right x_left order."""
+
+    page: int  # 1-indexed page number
+    cells: List[Cell]
+
+    @property
+    def y_top(self) -> float:
+        return max([cell.y_top for cell in self.cells] or [0.0])
+
+    @property
+    def y_bot(self) -> float:
+        return min([cell.y_bot for cell in self.cells] or [0.0])
+
+    @property
+    def x_left(self) -> float:
+        return min([cell.x_left for cell in self.cells] or [0.0])
+
+    @property
+    def x_right(self) -> float:
+        return max([cell.x_right for cell in self.cells] or [0.0])
+
+    def text(self) -> str:
+        """Tab-tab joined text of the non-empty cells (cell geometry is lost)."""
+        return "\t\t".join(filter(None, (cell.text for cell in self.cells)))
+
+
+def _cells_from_block_atoms(block_atoms: List[Atom]) -> List[Cell]:
+    """Turn one block's atoms into `Cell`s, ordered left→right.
+
+    Strips come from `_column_cluster` and are ordered by their smallest
+    x_left. Within a strip, atoms are ordered top-down and their stripped,
+    non-empty texts joined with a newline; a strip with no text yields no
+    cell. A cell's box is the union of its atoms' boxes. Closely spaced
+    neighbours (e.g. NSDL MF Holdings' folio `9013692 ` and units
+    `1,11,359.0`, 5.3pt apart) stay separate cells for x-based routing.
+    """
+    cells: List[Cell] = []
+    strips = sorted(_column_cluster(block_atoms), key=lambda s: min(a.x_left for a in s))
+    for strip in strips:
+        ordered = sorted(strip, key=lambda a: (-a.y_top, a.x_left))
+        parts = [piece for piece in (a.text.strip() for a in ordered) if piece]
+        if not parts:
+            continue
+        cell = Cell(
+            x_left=min(a.x_left for a in strip),
+            x_right=max(a.x_right for a in strip),
+            y_top=max(a.y_top for a in strip),
+            y_bot=min(a.y_bot for a in strip),
+            text="\n".join(parts),
+            atoms=ordered,
+        )
+        cells.append(cell)
+    return cells
+
+
+def blocks_from_atoms(pages: List[List[Atom]]) -> List[Block]:
+    """Build `Block`s from pre-extracted atoms, one `pages` entry per
+    page. Page numbers start at 1; within a page, blocks follow the
+    order produced by `_cluster_blocks`, and a block that yields no
+    cells is dropped. Taking atoms rather than a path lets a single
+    `extract_atoms` call feed both the holdings parser and the
+    investor extractor (NSDL/CDSL)."""
+    return [
+        Block(page=page_no, cells=cells)
+        for page_no, page_atoms in enumerate(pages, start=1)
+        for group in _cluster_blocks(_cluster_raw_lines(page_atoms))
+        if (cells := _cells_from_block_atoms(group))
+    ]
+
+
+def extract_blocks(
+    pdf_path: str,
+    password: str,
+    *,
+    _doc: "Optional[pdfium.PdfDocument]" = None,
+    _atoms: "Optional[List[List[Atom]]]" = None,
+) -> List[Block]:
+    """Entry point for the dedicated NSDL/CDSL parsers: a flat list of
+    `Block`s for the whole document, pages in document order and blocks
+    top-down within each page.
+
+    Given `_atoms`, those are used as-is and the PDF is not read;
+    otherwise `extract_atoms(pdf_path, password, _doc=_doc)` supplies them.
+    """
+    if _atoms is None:
+        _atoms = extract_atoms(pdf_path, password, _doc=_doc)
+    return blocks_from_atoms(_atoms)
diff --git a/casparser/parsers/pdfminer.py b/casparser/parsers/pdfminer.py
deleted file mode 100644
index 5a1f5e3..0000000
--- a/casparser/parsers/pdfminer.py
+++ /dev/null
@@ -1,263 +0,0 @@
-import io
-import re
-from typing import Iterator, List, Optional, Union
-
-from pdfminer.converter import PDFPageAggregator
-from pdfminer.layout import (
-    LAParams,
-    LTChar,
-    LTContainer,
-    LTTextBox,
-    LTTextBoxHorizontal,
-    LTTextBoxVertical,
-)
-from pdfminer.pdfdocument import PDFDocument, PDFPasswordIncorrect, PDFSyntaxError
-from pdfminer.pdfinterp import PDFPageInterpreter, PDFResourceManager
-from pdfminer.pdfpage import PDFPage
-from pdfminer.pdfparser import PDFParser
-
-from casparser.enums import FileType
-from casparser.exceptions import CASParseError, IncorrectPasswordError
-from casparser.types import InvestorInfo, PartialCASData
-
-from .utils import is_close
-
-# def parse_investor_info_nsdl(layout, width, height) -> InvestorInfo:
-#     """Parse investor info."""
-#     text_elements = sorted(
-#         [
-#             x
-#             for x in layout
-#             if isinstance(x, LTTextBoxHorizontal)
-#             # and x.x1 < width / 2
-#             # and x.y1 > height / 2
-#             and x.get_text().strip() != ""
-#         ],
-#         key=lambda x: -x.y1,
-#     )
-#     cas_id_found = False
-#     address_lines = []
-#     email = ""
-#     mobile = None
-#     name = None
-#     for el in text_elements:
-#         txt = el.get_text().strip()
-#         if not cas_id_found:
-#             if m := re.search(r"[CAS|NSDL]\s+ID\s*:\s*(.+?)(?:\s|$)", txt, re.I):
-#                 # email = m.group(1).strip()
-#                 cas_id_found = True
-#             continue
-#         if name is None:
-#             name = txt
-#         else:
-#             if (
-#                 re.search(
-#                     r"Statement\s+for\s+the\s+period|Your\s+demat\s+"
-#                     r"account\s+and\s+mutual\s+fund",
-#                     txt,
-#                     re.I | re.MULTILINE,
-#                 )
-#                 or mobile is not None
-#             ):
-#                 return InvestorInfo(
-#                     email=email, name=name, mobile=mobile or "", address="\n".join(address_lines)
-#                 )
-#             elif m := re.search(r"mobile\s*:\s*([+\d]+)(?:s|$)", txt, re.I):
-#                 mobile = m.group(1).strip()
-#             address_lines.append(txt)
-#     raise CASParseError("Unable to parse investor data")
-
-
-def parse_investor_info_mf(layout, width, height) -> InvestorInfo:
-    """Parse investor info."""
-    text_elements = sorted(
-        [
-            x
-            for x in layout
-            if isinstance(x, LTTextBoxHorizontal)
-            and x.x1 < width / 1.5
-            and x.y1 > height / 2
-            and x.get_text().strip() != ""
-        ],
-        key=lambda x: -x.y1,
-    )
-    email_found = False
-    address_lines = []
-    email = None
-    mobile = None
-    name = None
-    for el in text_elements:
-        txt = el.get_text().strip()
-        if not email_found:
-            if m := re.search(r"^\s*email\s+id\s*:\s*(.+?)(?:\s|$)", txt, re.I):
-                email = m.group(1).strip()
-                email_found = True
-            continue
-        if name is None:
-            name = txt
-        else:
-            if (
-                re.search(
-                    r"Portfolio\s+Summary|Mutual\s+Fund|Date\s+Transaction|Folio\s+No|^Date\s*$",
-                    txt,
-                    re.I | re.MULTILINE,
-                )
-                or mobile is not None
-            ):
-                return InvestorInfo(
-                    email=email, name=name, mobile=mobile or "", address="\n".join(address_lines)
-                )
-            elif m := re.search(r"mobile\s*:\s*([+\d]+)(?:s|$)", txt, re.I):
-                mobile = m.group(1).strip()
-            address_lines.append(txt)
-    raise CASParseError("Unable to parse investor data")
-
-
-def detect_pdf_source(document) -> FileType:
-    """
-    Try to infer pdf source (CAMS/KFINTECH) from the pdf metadata.
-
-    :param document: PDF document object
-    :return: FileType
-    """
-    file_type = FileType.UNKNOWN
-    for info in document.info:
-        producer = info.get("Producer", b"").decode("utf8", "ignore").replace("\x00", "")
-        if "Data Dynamics ActiveReports" in producer:
-            file_type = FileType.KFINTECH
-        elif "Stimulsoft Reports" in producer:
-            file_type = FileType.CAMS
-        if file_type != FileType.UNKNOWN:
-            break
-    return file_type
-
-
-def group_similar_rows(elements_list: List[Iterator[LTTextBoxHorizontal]]):
-    """
-    Group `LTTextBoxHorizontal` elements having similar rows, with a tolerance.
-
-    :param elements_list: List of elements from each page
-    """
-    lines = []
-    for elements in elements_list:
-        sorted_elements = list(sorted(elements, key=lambda x: (-x.y1, x.x0)))
-        y0, y1 = 0, 0
-        if len(sorted_elements) > 0:
-            y0, y1 = sorted_elements[0].y0, sorted_elements[0].y1
-        items = []
-        for el in sorted_elements:
-            if len(items) > 0 and not (
-                is_close(el.y1, y1, tol=5)
-                or is_close(el.y0, y0, tol=5)
-                or is_close(el.y1, y0, tol=2)
-                or is_close(el.y0, y1, tol=2)
-            ):
-                line = "\t\t".join(
-                    [x.get_text().strip() for x in sorted(items, key=lambda x: x.x0)]
-                )
-                if line.strip():
-                    lines.append(line)
-                items = []
-                y0, y1 = el.y0, el.y1
-            items.append(el)
-        if len(items) > 0:
-            line = "\t\t".join([x.get_text().strip() for x in sorted(items, key=lambda x: x.x0)])
-            if line.strip():
-                lines.append(line)
-    return lines
-
-
-def cas_pdf_to_text(filename: Union[str, io.IOBase], password) -> PartialCASData:
-    """
-    Parse CAS pdf and returns line data.
-
-    :param filename: CAS pdf file (CAMS or Kfintech)
-    :param password: CAS pdf password
-    :return: array of lines from the CAS.
-    """
-    file_type: Optional[FileType] = None
-
-    if isinstance(filename, str):
-        fp = open(filename, "rb")
-    elif hasattr(filename, "read") and hasattr(filename, "close"):  # file-like object
-        fp = filename
-    else:
-        raise CASParseError("Invalid input. filename should be a string or a file like object")
-
-    with fp:
-        pdf_parser = PDFParser(fp)
-        try:
-            document = PDFDocument(pdf_parser, password=password)
-        except PDFPasswordIncorrect:
-            raise IncorrectPasswordError("Incorrect PDF password!")
-        except PDFSyntaxError:
-            raise CASParseError("Unhandled error while opening file")
-
-        line_margin = {FileType.KFINTECH: 0.1, FileType.CAMS: 0.2}.get(
-            detect_pdf_source(document), 0.01
-        )
-
-        rsrc_mgr = PDFResourceManager()
-        laparams = LAParams(line_margin=line_margin, detect_vertical=True, all_texts=True)
-        device = PDFPageAggregator(rsrc_mgr, laparams=laparams)
-        interpreter = PDFPageInterpreter(rsrc_mgr, device)
-
-        pages: List[Iterator[LTTextBoxHorizontal]] = []
-
-        investor_info = None
-
-        def remove_non_english_text(textbox: LTContainer):
-            textbox._objs = [
-                obj
-                for obj in textbox._objs
-                if not (isinstance(obj, LTChar) and "Mangal" in obj.fontname)
-            ]
-            for i, obj in enumerate(textbox._objs):
-                if isinstance(obj, LTContainer):
-                    textbox._objs[i] = remove_non_english_text(obj)
-            return textbox
-
-        def extract_text_elements(layout: LTContainer) -> Iterator[LTTextBox]:
-            els = []
-            for el in layout:
-                if isinstance(el, LTTextBox):
-                    els.append(remove_non_english_text(el))
-                elif isinstance(el, LTContainer):
-                    els.extend(extract_text_elements(el))
-            return els
-
-        for page_num, page in enumerate(PDFPage.create_pages(document)):
-            interpreter.process_page(page)
-            layout = device.get_result()
-            text_elements = extract_text_elements(layout)
-            if file_type is None:
-                for el in filter(lambda x: isinstance(x, LTTextBoxVertical), text_elements):
-                    if re.search("CAMSCASWS", el.get_text()):
-                        file_type = FileType.CAMS
-                        break
-                    if re.search("KFINCASWS", el.get_text()):
-                        file_type = FileType.KFINTECH
-                        break
-                else:
-                    for el in text_elements:
-                        if "NSDL Consolidated Account Statement" in el.get_text():
-                            file_type = FileType.NSDL
-                            break
-                        elif "Central Depository Services (India) Limited" in el.get_text():
-                            file_type = FileType.CDSL
-                            break
-            if file_type in (FileType.CDSL, FileType.NSDL):
-                raise CASParseError(
-                    "pdfminer does not support this file type. Install pymupdf dependency"
-                )
-            if investor_info is None:
-                if file_type in (FileType.CAMS, FileType.KFINTECH):
-                    investor_info = parse_investor_info_mf(text_elements, *page.mediabox[2:])
-            #     elif file_type in (FileType.NSDL, FileType.CDSL) and page_num == 1:
-            #         investor_info = parse_investor_info_nsdl(text_elements, *page.mediabox[2:])
-            # if file_type == FileType.NSDL and page_num == 0:
-            #     # Ignore first page. no useful data
-            #     continue
-            pages.append(text_elements)
-        lines = group_similar_rows(pages)
-        return PartialCASData(file_type=file_type, investor_info=investor_info, lines=lines)
diff --git a/casparser/process/__init__.py b/casparser/process/__init__.py
deleted file mode 100644
index 9372c23..0000000
--- a/casparser/process/__init__.py
+++ /dev/null
@@ -1,38 +0,0 @@
-import re
-
-from ..enums import CASFileType, FileType
-from ..exceptions import CASParseError
-from ..types import ProcessedCASData
-from .cas_detailed import process_detailed_text
-from .cas_summary import process_summary_text
-from .cdsl_statement import process_cdsl_text
-from .nsdl_statement import process_nsdl_text
-from .regex import CAS_TYPE_RE
-
-
-def detect_cas_type(text):
-    if m := re.search(CAS_TYPE_RE, text, re.DOTALL | re.MULTILINE | re.I):
-        match = m.group(1).lower().strip()
-        if match == "statement":
-            return CASFileType.DETAILED
-        elif match == "summary":
-            return CASFileType.SUMMARY
-    return CASFileType.UNKNOWN
-
-
-def process_cas_text(text, file_type: FileType = FileType.UNKNOWN) -> ProcessedCASData:
-    """
-    Process the text version of a CAS pdf and return the detailed summary.
-    :param text:
-    :return:
-    """
-    if file_type == FileType.NSDL:
-        return process_nsdl_text(text)
-    elif file_type == FileType.CDSL:
-        return process_cdsl_text(text)
-    cas_statement_type = detect_cas_type(text[:1000])
-    if cas_statement_type == CASFileType.DETAILED:
-        return process_detailed_text(text)
-    elif cas_statement_type == CASFileType.SUMMARY:
-        return process_summary_text(text)
-    raise CASParseError("Unknown CAS file type")
diff --git a/casparser/process/cas_detailed.py b/casparser/process/cas_detailed.py
deleted file mode 100644
index 87f2316..0000000
--- a/casparser/process/cas_detailed.py
+++ /dev/null
@@ -1,336 +0,0 @@
-import re
-from collections import namedtuple
-from decimal import Decimal
-from typing import Dict, Optional, Tuple
-
-from dateutil import parser as date_parser
-
-from casparser.enums import CASFileType, TransactionType
-from casparser.exceptions import CASParseError, HeaderParseError
-from casparser.types import (
-    Folio,
-    ProcessedCASData,
-    Scheme,
-    SchemeValuation,
-    StatementPeriod,
-    TransactionData,
-)
-
-from .regex import (
-    AMC_RE,
-    CLOSE_UNITS_RE,
-    COST_RE,
-    DESCRIPTION_TAIL_RE,
-    DETAILED_DATE_RE,
-    DIVIDEND_RE,
-    FOLIO_KV_RE,
-    FOLIO_RE,
-    NAV_RE,
-    NOMINEE_RE,
-    OPEN_UNITS_RE,
-    REGISTRAR_RE,
-    SCHEME_KV_RE,
-    SCHEME_RE,
-    TRANSACTION_RE1,
-    TRANSACTION_RE2,
-    TRANSACTION_RE3,
-    TRANSACTION_RE4,
-    VALUATION_RE,
-)
-from .utils import isin_search
-
-ParsedTransaction = namedtuple(
-    "ParsedTransaction", ("date", "description", "amount", "units", "nav", "balance")
-)
-
-
-def str_to_decimal(value: Optional[str]) -> Decimal:
-    if isinstance(value, str):
-        return Decimal(value.replace(",", "_").replace("(", "-"))
-
-
-def parse_header(text):
-    """
-    Parse CAS header data.
-    :param text: CAS text
-    """
-    if m := re.search(DETAILED_DATE_RE, text, re.DOTALL | re.MULTILINE | re.I):
-        return m.groupdict()
-    raise HeaderParseError("Error parsing CAS header")
-
-
-def get_transaction_type(
-    description: str, units: Optional[Decimal]
-) -> Tuple[TransactionType, Optional[Decimal]]:
-    """Get transaction type from the description text."""
-
-    dividend_rate = None
-    description = description.lower()
-    if div_match := re.search(DIVIDEND_RE, description, re.I | re.DOTALL):
-        reinvest_flag, dividend_str = div_match.groups()
-        dividend_rate = Decimal(dividend_str)
-        txn_type = (
-            TransactionType.DIVIDEND_REINVEST if reinvest_flag else TransactionType.DIVIDEND_PAYOUT
-        )
-    elif units is None:
-        if "stt" in description:
-            txn_type = TransactionType.STT_TAX
-        elif "stamp" in description:
-            txn_type = TransactionType.STAMP_DUTY_TAX
-        elif "tds" in description:
-            txn_type = TransactionType.TDS_TAX
-        else:
-            txn_type = TransactionType.MISC
-    elif units > 0:
-        if "switch" in description:
-            if "merger" in description:
-                txn_type = TransactionType.SWITCH_IN_MERGER
-            else:
-                txn_type = TransactionType.SWITCH_IN
-        elif "segregat" in description:
-            txn_type = TransactionType.SEGREGATION
-        elif (
-            "sip" in description
-            or "systematic" in description
-            or re.search("instal+ment", description, re.I)
-            or re.search("sys.+?invest", description, re.I | re.DOTALL)
-        ):
-            txn_type = TransactionType.PURCHASE_SIP
-        else:
-            txn_type = TransactionType.PURCHASE
-    elif units < 0:
-        if re.search(
-            r"reversal|rejection|dishonoured|mismatch|insufficient\s+balance", description, re.I
-        ):
-            txn_type = TransactionType.REVERSAL
-        elif "switch" in description:
-            if "merger" in description:
-                txn_type = TransactionType.SWITCH_OUT_MERGER
-            else:
-                txn_type = TransactionType.SWITCH_OUT
-        else:
-            txn_type = TransactionType.REDEMPTION
-    else:
-        print(
-            "Warning: Error identifying transaction. "
-            "Please report the issue with the transaction description"
-        )
-        print(f"Txn description: {description} :: Units: {units}")
-        txn_type = TransactionType.UNKNOWN
-
-    return txn_type, dividend_rate
-
-
-def get_parsed_scheme_name(scheme) -> str:
-    scheme = re.sub(r"\((formerly|erstwhile).+?\)", "", scheme, flags=re.I | re.DOTALL).strip()
-    scheme = re.sub(r"\((Demat|Non-Demat).*", "", scheme, flags=re.I | re.DOTALL).strip()
-    scheme = re.sub(r"\s+", " ", scheme).strip()
-    return re.sub(r"[^a-zA-Z0-9_)]+$", "", scheme).strip()
-
-
-def parse_transaction(line) -> Optional[ParsedTransaction]:
-    for regex in (TRANSACTION_RE1, TRANSACTION_RE2, TRANSACTION_RE3, TRANSACTION_RE4):
-        if m := re.search(regex, line, re.DOTALL | re.MULTILINE | re.I):
-            groups = m.groups()
-            date = description = amount = units = nav = balance = None
-            if groups.count(None) == 3:
-                # Tax entries
-                date, description, amount, *_ = groups
-            elif groups.count(None) == 2:
-                # Segregated Portfolio Entries
-                date, description, units, balance, *_ = groups
-            elif groups.count(None) == 1:
-                # Zero unit entries
-                date, description, amount, units, nav, balance = groups
-                units = "0.000"
-            elif groups.count(None) == 0:
-                # Normal entries
-                date, description, amount, units, nav, balance = groups
-            if date is not None:
-                # Tax-style entries (e.g. ``*** Stamp Duty ***``) only carry an
-                # amount; if a downstream column from a wrapped row got
-                # appended, the regex may misread it as units/balance.
-                if description and re.match(r"\s*\*\*\*", description):
-                    if amount is None and units is not None:
-                        amount = units
-                    units = None
-                    balance = None
-                return ParsedTransaction(date, description, amount, units, nav, balance)
-
-
-def process_detailed_text(text):
-    """
-    Process the text version of a CAS pdf and return the detailed summary.
-    :param text:
-    :return:
-    """
-    hdr_data = parse_header(text[:1000])
-    statement_period = StatementPeriod(from_=hdr_data["from"], to=hdr_data["to"])
-
-    folios: Dict[str, Folio] = {}
-    current_folio = None
-    current_amc = None
-    curr_scheme_data: Optional[Scheme] = None
-    lines = text.split("\u2029")
-    for idx, line in enumerate(lines):
-        # Parse schemes with long names (single line) effectively pushing
-        # "Registrar" column to the previous line
-        if re.search(REGISTRAR_RE, line):
-            line = "\t\t".join([lines[idx + 1], line])
-        # Some scheme rows have the registrar header at the end of the scheme
-        # line but the registrar value (e.g. "KFINTECH") on the following line.
-        elif idx + 1 < len(lines) and re.search(r"Registrar\s*:\s*$", line):
-            next_line = lines[idx + 1].strip()
-            # Two-column wrap: both the advisor value and the registrar value
-            # wrapped to the next visual row. The next line looks like
-            # ``<advisor>)\t\t<registrar>``. Splice the advisor into the
-            # ``(Advisor:`` slot and the registrar onto the end.
-            two_col = re.match(r"^([-\w]+)\)\s*\t+\s*(\S+)\s*$", next_line)
-            if two_col and re.search(r"\(Advisor\s*:\s*\t", line):
-                advisor_value, registrar_value = two_col.groups()
-                line = (
-                    re.sub(
-                        r"(\(Advisor\s*:\s*)",
-                        r"\1" + advisor_value + ")",
-                        line,
-                        count=1,
-                    )
-                    + registrar_value
-                )
-            else:
-                line = line + next_line
-        # Scheme name with advisor info wraps across visual rows; the advisor
-        # value (e.g. "WEALTH)") ends up on the next line.
-        elif (
-            idx + 1 < len(lines)
-            and re.search(r"\(Advisor\s*:\s*(?:\t|$)", line)
-            and re.match(r"^[-\w]+\)\s*$", lines[idx + 1].strip())
-        ):
-            advisor_value = lines[idx + 1].strip().rstrip(")")
-            line = re.sub(r"(\(Advisor\s*:\s*)", r"\1" + advisor_value + ")", line, count=1)
-        # Scheme name wraps and the wrapped continuation contains the ISIN /
-        # advisor info on the next visual row.
-        elif (
-            idx + 1 < len(lines)
-            and re.search(r"Registrar\s*:\s*\w+\s*$", line)
-            and re.search(r"^[-\w]+-", line)
-            and re.search(r"ISIN\s*:|\(Advisor\s*:", lines[idx + 1])
-        ):
-            line = line + " " + lines[idx + 1].strip()
-        if amc_match := re.search(AMC_RE, line, re.I | re.DOTALL):
-            current_amc = amc_match.group(0)
-        elif m := re.search(FOLIO_RE, line):
-            folio = m.group(1).strip()
-            if current_folio is None or current_folio != folio:
-                if curr_scheme_data and current_folio is not None:
-                    folios[current_folio].schemes.append(curr_scheme_data)
-                    curr_scheme_data = None
-                current_folio = folio
-
-                pan = ""
-                kyc = None
-                pankyc = None
-                for k, v in re.findall(FOLIO_KV_RE, line):
-                    v = v.strip()
-                    if k == "KYC":
-                        kyc = v
-                    elif len(v) == 10:
-                        pan = v
-                    else:
-                        pankyc = v
-
-                if folio not in folios:
-                    folios[folio] = Folio(
-                        folio=current_folio,
-                        amc=current_amc,
-                        PAN=pan,
-                        KYC=kyc,
-                        PANKYC=pankyc,
-                        schemes=[],
-                    )
-        elif m := re.search(SCHEME_RE, line, re.DOTALL | re.MULTILINE | re.I):
-            if current_folio is None:
-                raise CASParseError("Layout Error! Scheme found before folio entry.")
-            scheme = get_parsed_scheme_name(m.group("name"))
-            if curr_scheme_data is None or curr_scheme_data.scheme != scheme:
-                if curr_scheme_data:
-                    folios[current_folio].schemes.append(curr_scheme_data)
-
-            match_pairs = re.findall(SCHEME_KV_RE, line, re.DOTALL | re.MULTILINE | re.I)
-            metadata: Dict[str, str] = {}
-            for key, value in match_pairs:
-                metadata[key.strip().lower()] = value.strip()
-            isin_ = metadata.get("isin")
-            rta_code = m.group("code").strip()
-            rta = m.group("rta").strip()
-            isin, amfi, scheme_type = isin_search(scheme, rta, rta_code, isin=isin_)
-            curr_scheme_data = Scheme(
-                scheme=scheme,
-                advisor=metadata.get("advisor"),
-                rta=rta,
-                rta_code=rta_code,
-                isin=isin,
-                type=scheme_type or "N/A",
-                amfi=amfi,
-                open=Decimal(0.0),
-                close=Decimal(0.0),
-                close_calculated=Decimal(0.0),
-                valuation=SchemeValuation(
-                    date=statement_period.to, value=Decimal(0.0), nav=Decimal(0.0)
-                ),
-                transactions=[],
-            )
-        if not curr_scheme_data:
-            continue
-        if m := re.search(NOMINEE_RE, line, re.I | re.DOTALL):
-            curr_scheme_data.nominees.extend([x.strip() for x in m.groups() if x.strip()])
-        if m := re.search(OPEN_UNITS_RE, line):
-            curr_scheme_data.open = Decimal(m.group(1).replace(",", "_"))
-            curr_scheme_data.close_calculated = curr_scheme_data.open
-            continue
-        if m := re.search(CLOSE_UNITS_RE, line):
-            curr_scheme_data.close = Decimal(m.group(1).replace(",", "_"))
-        if m := re.search(COST_RE, line, re.I):
-            curr_scheme_data.valuation.cost = Decimal(m.group(1).replace(",", "_"))
-        if m := re.search(VALUATION_RE, line, re.I):
-            curr_scheme_data.valuation.date = date_parser.parse(m.group(1)).date()
-            curr_scheme_data.valuation.value = Decimal(m.group(2).replace(",", "_"))
-        if m := re.search(NAV_RE, line, re.I):
-            curr_scheme_data.valuation.date = date_parser.parse(m.group(1)).date()
-            curr_scheme_data.valuation.nav = Decimal(m.group(2).replace(",", "_"))
-            continue
-        description_tail = ""
-        if m := re.search(DESCRIPTION_TAIL_RE, line):
-            description_tail = m.group(1).strip()
-            line = line.replace(m.group(1), "")
-        if parsed_txn := parse_transaction(line):
-            date = date_parser.parse(parsed_txn.date).date()
-            desc = parsed_txn.description.strip()
-            if description_tail != "":
-                desc = " ".join([desc, description_tail])
-            amt = str_to_decimal(parsed_txn.amount)
-            units = str_to_decimal(parsed_txn.units)
-            nav = str_to_decimal(parsed_txn.nav)
-            balance = str_to_decimal(parsed_txn.balance)
-            txn_type, dividend_rate = get_transaction_type(desc, units)
-            if units is not None:
-                curr_scheme_data.close_calculated += units
-            curr_scheme_data.transactions.append(
-                TransactionData(
-                    date=date,
-                    description=desc,
-                    amount=amt,
-                    units=units,
-                    nav=nav,
-                    balance=balance,
-                    type=txn_type.name,
-                    dividend_rate=dividend_rate,
-                )
-            )
-    if curr_scheme_data:
-        folios[current_folio].schemes.append(curr_scheme_data)
-    return ProcessedCASData(
-        cas_type=CASFileType.DETAILED,
-        statement_period=statement_period,
-        folios=list(folios.values()),
-    )
diff --git a/casparser/process/cas_summary.py b/casparser/process/cas_summary.py
deleted file mode 100644
index 73bb0a5..0000000
--- a/casparser/process/cas_summary.py
+++ /dev/null
@@ -1,98 +0,0 @@
-import re
-from decimal import Decimal
-
-from dateutil import parser as date_parser
-
-from casparser.enums import CASFileType
-from casparser.exceptions import HeaderParseError
-from casparser.types import (
-    Folio,
-    ProcessedCASData,
-    Scheme,
-    SchemeValuation,
-    StatementPeriod,
-)
-
-from .regex import SCHEME_TAIL_RE, SUMMARY_DATE_RE, SUMMARY_ROW_RE
-from .utils import isin_search
-
-
-def parse_header(text):
-    """
-    Parse CAS header data.
-    :param text: CAS text
-    """
-    if m := re.search(SUMMARY_DATE_RE, text, re.DOTALL | re.MULTILINE | re.I):
-        return m.groupdict()
-    raise HeaderParseError("Error parsing CAS header")
-
-
-def process_summary_text(text):
-    """
-    Process the text version of a CAS pdf and return the detailed summary.
-    :param text:
-    :return:
-    """
-    hdr_data = parse_header(text[:1000])
-    statement_period = StatementPeriod(from_=hdr_data["date"], to=hdr_data["date"])
-
-    folios = {}
-    current_folio = None
-    current_amc = "N/A"
-    lines = text.split("\u2029")
-    for line in lines:
-        if len(folios) > 0 and re.search("Total", line, re.I):
-            break
-        scheme_tails = []
-        if m := re.findall(SCHEME_TAIL_RE, line):
-            for txt in m:
-                line = line.replace(txt, "")
-                scheme_tails.append(re.sub(r"\s+", " ", txt).strip())
-        if m := re.search(SUMMARY_ROW_RE, line, re.DOTALL | re.MULTILINE | re.I):
-            folio = m.group("folio").strip()
-            if current_folio is None or current_folio != folio:
-                current_folio = folio
-                if folio not in folios:
-                    folios[folio] = Folio(
-                        folio=current_folio,
-                        amc=current_amc,
-                        PAN="N/A",
-                        KYC="N/A",
-                        PANKYC="N/A",
-                        schemes=[],
-                    )
-            scheme = m.group("name")
-            if len(scheme_tails) > 0:
-                scheme = " ".join([scheme, *scheme_tails])
-            scheme = re.sub(r"\(formerly.+?\)", "", scheme, flags=re.I | re.DOTALL).strip()
-            rta = m.group("rta").strip()
-            rta_code = m.group("code").strip()
-            isin_ = m.group("isin")
-            isin, amfi, scheme_type = isin_search(scheme, rta, rta_code, isin=isin_)
-            scheme_data = Scheme(
-                scheme=scheme,
-                advisor="N/A",
-                rta_code=rta_code,
-                rta=rta,
-                isin=isin,
-                amfi=amfi,
-                type=scheme_type or "N/A",
-                open=Decimal(m.group("balance").replace(",", "_")),
-                close=Decimal(m.group("balance").replace(",", "_")),
-                close_calculated=Decimal(m.group("balance").replace(",", "_")),
-                valuation=SchemeValuation(
-                    date=date_parser.parse(m.group("date")).date(),
-                    nav=Decimal(m.group("nav").replace(",", "_")),
-                    value=Decimal(m.group("value").replace(",", "_")),
-                ),
-                transactions=[],
-            )
-            cost = m.group("cost")
-            if cost is not None:
-                scheme_data.valuation.cost = Decimal(cost.replace(",", "_"))
-            folios[current_folio].schemes.append(scheme_data)
-    return ProcessedCASData(
-        cas_type=CASFileType.SUMMARY,
-        statement_period=statement_period,
-        folios=list(folios.values()),
-    )
diff --git a/casparser/process/cdsl_statement.py b/casparser/process/cdsl_statement.py
deleted file mode 100644
index b964341..0000000
--- a/casparser/process/cdsl_statement.py
+++ /dev/null
@@ -1,301 +0,0 @@
-import re
-from decimal import Decimal
-
-from casparser.exceptions import HeaderParseError
-from casparser.types import (
-    DematAccount,
-    DematOwner,
-    Equity,
-    MutualFund,
-    NSDLCASData,
-    StatementPeriod,
-)
-
-from .regex import DEMAT_STATEMENT_PERIOD_RE
-
-CDSL_DP_ID_RE = (
-    r"DP\s*Name\s*:\s*(.+?)\s*DP\s*ID\s*:\s*(\d+)\s*CLIENT\s*ID\s*:\s*(\d+)"
-)
-
-CDSL_DP_NAME_BOID_RE = (
-    r"DP\s*Name\s*:\s*(.+?)\s*BO\s*ID\s*:\s*(\d+)"
-)
-
-DEMAT_HOLDINGS_HEADER_RE = r"HOLDING\s+STATEMENT"
-
-ISIN_LINE_RE = r"^(?P<isin>[A-Z]{2}[0-9A-Z]{9}\d)"
-
-_PAGE_SKIP_RE = re.compile(
-    r"^(?:Page\s+\d+\s+of\s+\d+|Central\s+Depository|CONSOLIDATED\s+ACCOUNT"
-    r"|FORM\s+AND\s+INVESTMENTS|Investments|A\s+Wing|Lower\s+Parel)",
-    re.I,
-)
-
-_PAGE_HEADER_SKIP_RE = re.compile(
-    r"^(?:RATAN\s+KUMAR|(?:ISIN|Security)\t|Account\s+Type|"
-    r"TER\s+&\s+COMMISSION|YOUR\s+CONSOLIDATED|TER\s+&|Portfolio\s+Value)",
-    re.I,
-)
-
-
-def parse_decimal(value):
-    if isinstance(value, str):
-        value = value.replace(",", "")
-        if value in ("--", "", "0", "N.A"):
-            return Decimal("0")
-        return Decimal(value)
-    return Decimal(str(value)) if value is not None else Decimal("0")
-
-
-def parse_header(text):
-    if m := re.search(
-        DEMAT_STATEMENT_PERIOD_RE,
-        text,
-        re.DOTALL | re.MULTILINE | re.I,
-    ):
-        return m.groupdict()
-    raise HeaderParseError("Error parsing CAS header")
-
-
-def _is_numeric_token(token):
-    return bool(re.match(r"^[\d,]+\.?\d*$|^--$", token))
-
-
-def _split_name_numeric(parts):
-    name_parts = []
-    numeric_parts = []
-    for p in parts:
-        p = p.strip()
-        if not p:
-            continue
-        if _is_numeric_token(p):
-            numeric_parts.append(p)
-        else:
-            name_parts.append(p)
-    return name_parts, numeric_parts
-
-
-def process_cdsl_text(text):
-    hdr_data = parse_header(text)
-    statement_period = StatementPeriod(from_=hdr_data["from"], to=hdr_data["to"])
-
-    lines = text.split("\u2029")
-
-    dp_info_map = {}
-    for line in lines:
-        if m := re.search(CDSL_DP_ID_RE, line, re.I):
-            dp_name, dp_id, client_id = m.groups()
-            dp_name_clean = dp_name.strip()
-            dp_info_map[dp_name_clean] = {
-                "name": dp_name_clean,
-                "dp_id": dp_id,
-                "client_id": client_id,
-            }
-
-    demat_accounts = {}
-    for dp_name, info in dp_info_map.items():
-        key = (info["dp_id"], info["client_id"])
-        demat_accounts[key] = {
-            "name": dp_name,
-            "type": "CDSL Demat Account",
-            "dp_id": info["dp_id"],
-            "client_id": info["client_id"],
-            "folios": 0,
-            "balance": Decimal("0"),
-            "owners": [],
-            "equities": [],
-            "mutual_funds": [],
-        }
-
-    dp_name_to_key = {}
-    for key, acct in demat_accounts.items():
-        dp_name_to_key[acct["name"].upper()] = key
-
-    current_account_key = None
-    in_holdings = False
-    in_mf_holdings = False
-    mf_scheme_name_lines = []
-    mf_folio_holdings = []
-
-    for idx, line in enumerate(lines):
-        stripped = line.strip()
-
-        if not stripped:
-            continue
-
-        if _PAGE_SKIP_RE.match(stripped):
-            continue
-
-        if re.search(r"MUTUAL\s+FUND\s+UNITS\s+HELD\s+WITH\s+MF", stripped, re.I):
-            in_mf_holdings = True
-            in_holdings = False
-            mf_scheme_name_lines = []
-            continue
-
-        if in_mf_holdings:
-            if re.search(r"MUTUAL\s+FUND\s+UNITS\s+HELD\s+AS\s+ON",
-                         stripped, re.I):
-                mf_scheme_name_lines = []
-                continue
-            if re.search(r"Grand\s+Total|Average\s+Total\s+Expense|Load\s+Structures|"
-                         r"Statement\s+for\s+the\s+period|IDCW|Notes|About\s+CDSL",
-                         stripped, re.I):
-                in_mf_holdings = False
-                continue
-            if _PAGE_HEADER_SKIP_RE.match(stripped):
-                continue
-            if re.search(r"Scheme\s+Name|^ISIN\b|Date\s+Transaction|Opening\s+Balance|"
-                         r"Closing\s+Balance|Transaction\s+Description|Folio\s+No",
-                         stripped, re.I):
-                continue
-            if re.search(r"(?:AMC|Mutual\s+Fund)\s*$", stripped, re.I) and not re.match(
-                ISIN_LINE_RE, line
-            ):
-                continue
-
-            has_isin = re.search(r"INF[A-Z0-9]{8}\d", line)
-            if not has_isin:
-                continue
-
-            parts = line.split("\t\t")
-            stripped_parts = [p.strip() for p in parts if p.strip()]
-
-            isin = ""
-            scheme_name_parts = []
-            folio = ""
-            numeric_fields = []
-            found_isin = False
-
-            for p in stripped_parts:
-                if re.match(r"^INF[A-Z0-9]{8}\d$", p):
-                    isin = p
-                    found_isin = True
-                    continue
-                if not found_isin:
-                    scheme_name_parts.append(p)
-                    continue
-                if not folio and p not in ("DIRECT", "") and not p.startswith("ARN"):
-                    folio = p
-                    continue
-                if _is_numeric_token(p):
-                    numeric_fields.append(p)
-
-            scheme_name = " ".join(scheme_name_parts)
-            scheme_name = re.sub(r"\s+", " ", scheme_name).strip()
-
-            closing_bal = Decimal("0")
-            nav = Decimal("0")
-            valuation = Decimal("0")
-
-            if len(numeric_fields) >= 4:
-                closing_bal = parse_decimal(numeric_fields[0])
-                nav = parse_decimal(numeric_fields[1])
-                valuation = parse_decimal(numeric_fields[3])
-
-            mf_folio_holdings.append({
-                "isin": isin,
-                "name": scheme_name,
-                "balance": str(closing_bal),
-                "nav": str(nav),
-                "value": str(valuation),
-            })
-
-            continue
-
-        if re.search(CDSL_DP_NAME_BOID_RE, line, re.I):
-            in_holdings = False
-            m = re.search(CDSL_DP_NAME_BOID_RE, line, re.I)
-            dp_name = m.group(1).strip().upper()
-            current_account_key = dp_name_to_key.get(dp_name)
-            continue
-
-        if re.search(DEMAT_HOLDINGS_HEADER_RE, stripped, re.I):
-            in_holdings = True
-            continue
-
-        if not in_holdings or current_account_key is None:
-            continue
-
-        if re.search(r"Portfolio\s+Value\s+`", stripped, re.I):
-            in_holdings = False
-            continue
-
-        if _PAGE_HEADER_SKIP_RE.match(stripped):
-            continue
-
-        if m := re.match(ISIN_LINE_RE, line):
-            isin = m.group("isin")
-            is_mf = isin.startswith("INF")
-            parts = line.split("\t\t")
-            name_parts, numeric_parts = _split_name_numeric(parts[1:])
-            name = re.sub(r"\s+", " ", " ".join(name_parts)).strip()
-
-            if len(numeric_parts) >= 2:
-                price = parse_decimal(numeric_parts[-2]) if len(numeric_parts) >= 3 else Decimal("0")
-                value = parse_decimal(numeric_parts[-1])
-                if price != 0:
-                    balance = round(value / price, 3)
-                else:
-                    balance = parse_decimal(numeric_parts[-3]) if len(numeric_parts) >= 3 else Decimal("0")
-            else:
-                continue
-
-            if is_mf:
-                demat_accounts[current_account_key]["mutual_funds"].append({
-                    "isin": isin,
-                    "name": name,
-                    "balance": str(balance),
-                    "nav": str(price),
-                    "value": str(value),
-                })
-            else:
-                demat_accounts[current_account_key]["equities"].append({
-                    "isin": isin,
-                    "name": name,
-                    "num_shares": str(balance),
-                    "price": str(price),
-                    "value": str(value),
-                })
-
-    account_objects = []
-    for key, acct_data in demat_accounts.items():
-        equities = [Equity(**e) for e in acct_data["equities"]]
-        mutual_funds = [MutualFund(**m) for m in acct_data["mutual_funds"]]
-
-        total_value = sum(
-            (Decimal(e["value"]) for e in acct_data["equities"])
-        ) + sum(
-            (Decimal(m["value"]) for m in acct_data["mutual_funds"])
-        )
-
-        account_objects.append(DematAccount(
-            name=acct_data["name"],
-            type=acct_data["type"],
-            dp_id=acct_data["dp_id"],
-            client_id=acct_data["client_id"],
-            folios=len(equities) + len(mutual_funds),
-            balance=total_value,
-            owners=[],
-            equities=equities,
-            mutual_funds=mutual_funds,
-        ))
-
-    if mf_folio_holdings:
-        mf_list = [MutualFund(**m) for m in mf_folio_holdings]
-        mf_total = sum(Decimal(m["value"]) for m in mf_folio_holdings)
-        account_objects.append(DematAccount(
-            name="Mutual Fund Folios",
-            type="MF",
-            dp_id="",
-            client_id="",
-            folios=len(mf_folio_holdings),
-            balance=mf_total,
-            owners=[],
-            equities=[],
-            mutual_funds=mf_list,
-        ))
-
-    return NSDLCASData(
-        statement_period=statement_period,
-        accounts=account_objects,
-    )
diff --git a/casparser/process/nsdl_statement.py b/casparser/process/nsdl_statement.py
deleted file mode 100644
index 7e1b36a..0000000
--- a/casparser/process/nsdl_statement.py
+++ /dev/null
@@ -1,213 +0,0 @@
-import re
-
-from casparser_isin import ISINDb
-
-from casparser.exceptions import HeaderParseError
-from casparser.types import NSDLCASData, StatementPeriod
-
-from .regex import (
-    DEMAT_AC_HOLDER_RE,
-    DEMAT_AC_TYPE_RE,
-    DEMAT_DP_ID_RE,
-    DEMAT_HEADER_RE,
-    DEMAT_MF_HEADER_RE,
-    DEMAT_MF_TYPE_RE,
-    DEMAT_STATEMENT_PERIOD_RE,
-    NSDL_CDSL_HOLDINGS_RE,
-    NSDL_EQ_RE,
-    NSDL_MF_HOLDINGS_RE,
-    NSDL_MF_RE,
-)
-
-
-def parse_header(text):
-    """
-    Parse CAS header data.
-    :param text: CAS text
-    """
-    if m := re.search(
-        DEMAT_STATEMENT_PERIOD_RE,
-        text,
-        re.DOTALL | re.MULTILINE | re.I,
-    ):
-        return m.groupdict()
-    raise HeaderParseError("Error parsing CAS header")
-
-
-def process_nsdl_text(text):
-    hdr_data = parse_header(text)
-    statement_period = StatementPeriod(from_=hdr_data["from"], to=hdr_data["to"])
-    accounts = re.findall(
-        DEMAT_HEADER_RE,
-        text,
-        flags=re.I | re.MULTILINE,
-    )
-    mutual_funds = re.findall(
-        DEMAT_MF_HEADER_RE,
-        text,
-        flags=re.I | re.MULTILINE,
-    )
-    demat = {}
-    for account_type, account_name, dp_id, client_id, folios, balance in accounts:
-        demat[(dp_id, client_id)] = {
-            "name": account_name,
-            "folios": folios,
-            "balance": balance,
-            "type": account_type,
-            "dp_id": dp_id,
-            "client_id": client_id,
-            "owners": [],
-            "equities": [],
-            "mutual_funds": [],
-        }
-    for num_folios, _, balance in mutual_funds:
-        demat[(None, None)] = {
-            "name": "Mutual Fund Folios",
-            "folios": num_folios,
-            "balance": balance,
-            "type": "MF",
-            "dp_id": "",
-            "client_id": "",
-            "owners": [],
-            "equities": [],
-            "mutual_funds": [],
-        }
-
-    lines = text.split("\u2029")
-    start_processing_holdings = False
-    current_demat = None
-    demat_holders = []
-    for line in lines:
-        if m := re.search(DEMAT_AC_TYPE_RE, line, flags=re.I):
-            start_processing_holdings = True
-            current_demat = None
-        if not start_processing_holdings:
-            continue
-        if current_demat is None:
-            if m := re.search(DEMAT_MF_TYPE_RE, line.strip(), flags=re.I):
-                if (None, None) in demat:
-                    current_demat = demat[(None, None)]
-                else:
-                    continue
-
-            if "ACCOUNT HOLDER" in line.upper():
-                for owner, pan in re.findall(DEMAT_AC_HOLDER_RE, line, re.I):
-                    demat_holders.append(
-                        {
-                            "name": owner,
-                            "PAN": pan,
-                        }
-                    )
-
-            if m := re.search(
-                DEMAT_DP_ID_RE,
-                line,
-                flags=re.I | re.MULTILINE | re.DOTALL,
-            ):
-                dp_id, client_id = m.groups()
-                current_demat = demat[(dp_id, client_id)]
-                current_demat["owners"] = demat_holders.copy()
-                demat_holders = []
-            continue
-        if "NSDL" in current_demat["type"]:
-            if m := re.search(
-                NSDL_EQ_RE,
-                line,
-                re.DOTALL | re.MULTILINE | re.I,
-            ):
-                isin, _, face_value, num_shares, market_value, current_value = m.groups()
-                current_demat["equities"].append(
-                    {
-                        "isin": isin,
-                        # "face_value": face_value,
-                        "num_shares": num_shares,
-                        "price": market_value,
-                        "value": current_value,
-                    }
-                )
-                continue
-            elif m := re.search(
-                NSDL_MF_RE,
-                line,
-                re.DOTALL | re.MULTILINE | re.I,
-            ):
-                isin, name, balance, nav, value = m.groups()
-                current_demat["mutual_funds"].append(
-                    {
-                        "isin": isin,
-                        "name": name,
-                        "balance": balance,
-                        "nav": nav,
-                        "value": value,
-                    }
-                )
-                continue
-        elif "CDSL" in current_demat["type"]:
-            if m := re.search(
-                NSDL_CDSL_HOLDINGS_RE,
-                line,
-                re.DOTALL | re.MULTILINE | re.I,
-            ):
-                isin, name, balance, *_, nav, value = m.groups()
-                if isin.startswith("INF"):
-                    current_demat["mutual_funds"].append(
-                        {
-                            "isin": isin,
-                            "name": name,
-                            "balance": balance,
-                            "nav": nav,
-                            "value": value,
-                        }
-                    )
-                elif isin.startswith("INE"):
-                    current_demat["equities"].append(
-                        {
-                            "isin": isin,
-                            # "face_value": None,
-                            "num_shares": balance,
-                            "price": nav,
-                            "value": value,
-                        }
-                    )
-                continue
-        elif current_demat["type"] == "MF":
-            if m := re.search(
-                NSDL_MF_HOLDINGS_RE,
-                line,
-                re.DOTALL | re.MULTILINE | re.I,
-            ):
-                isin, ucc, name, folio, units, avg_cost, total_cost, nav, value, pnl, returns = (
-                    m.groups()
-                )
-                name = re.sub(r"\s+", " ", name).strip()
-                name = re.sub(r"[^a-zA-Z0-9_)]+$", "", name).strip()
-                current_demat["mutual_funds"].append(
-                    {
-                        "isin": isin,
-                        "ucc": ucc,
-                        "name": name,
-                        "folio": folio,
-                        "balance": units,
-                        "avg_cost": avg_cost,
-                        "total_cost": total_cost,
-                        "nav": nav,
-                        "value": value,
-                        "pnl": pnl,
-                        "return": returns,
-                    }
-                )
-
-    cas_data = NSDLCASData(
-        statement_period=statement_period,
-        accounts=list(demat.values()),
-    )
-
-    with ISINDb() as isin_db:
-        for account in cas_data.accounts:
-            for equity in account.equities:
-                if equity.name is None:
-                    isin_data = isin_db.isin_lookup(equity.isin)
-                    if isin_data:
-                        equity.name = isin_data.name
-
-    return cas_data
diff --git a/casparser/process/regex.py b/casparser/process/regex.py
deleted file mode 100644
index a6b71e6..0000000
--- a/casparser/process/regex.py
+++ /dev/null
@@ -1,77 +0,0 @@
-"""Regular expressions for parsing various sections in CAS."""
-
-date_re = r"(\d{2}-[A-Za-z]{3}-\d{4})"
-amt_re = r"([(-]*\d[\d,.]+)\)*"
-
-isin_re = r"[A-Z]{2}[0-9A-Z]{9}[0-9]{1}"
-
-CAS_TYPE_RE = r"consolidated\s+account\s+(statement|summary)"
-DETAILED_DATE_RE = r"(?P<from>\d{2}-[a-zA-Z]{3}-\d{4})\s+to\s+(?P<to>\d{2}-[a-zA-Z]{3}-\d{4})"
-SUMMARY_DATE_RE = r"as\s+on\s+(?P<date>\d{2}-[a-zA-Z]{3}-\d{4})"
-SUMMARY_ROW_RE = (
-    r"(?P<folio>[\d/\s]+?)(?P<isin>[A-Z]{2}[0-9A-Z]{9}[0-9]{1})?\s+(?P<code>[ \w]+)-"
-    r"(?P<name>.+?)\s+(?P<cost>[\d,.]+)?\s+(?P<balance>[\d,.]+)\t\t"
-    r"(?P<date>\d{2}-[A-Za-z]{3}-\d{4})\t\t(?P<nav>[\d,.]+)\t\t(?P<value>[\d,.]+)"
-    r"\t\t(?P<rta>\w+)\s*$"
-)
-SCHEME_TAIL_RE = r"(\n.+?)\t\t"
-
-AMC_RE = r"^(.+?\s+(MF|Mutual\s*Fund)|franklin\s+templeton\s+investments)$"
-FOLIO_RE = r"^Folio\s+No\s*:\s+([\d/\s]+\d)\s"
-FOLIO_KV_RE = r"(PAN|KYC)\s*:\s*([A-Z]{5}\d{4}[A-Z]|OK|NOT OK)"
-
-NOMINEE_RE = r"\s*Nominee\s+[1-3]\s*:\s*(.*?)" * 3 + r"$"
-
-SCHEME_RE = (
-    r"(?P<code>[\s\w]+-*[gdp]?)-\s*\d*\s*(?P<name>.+?)(?:\t\t|\(\s*Advis|ISIN).*?"
-    r"Registrar\s*:\s*(?P<rta>[^\s]*).*$"
-)
-SCHEME_KV_RE = r"""(\w+)\s*:\s*([-\w]+)"""
-
-REGISTRAR_RE = r"^\s*Registrar\s*:\s*(.*)\s*$"
-OPEN_UNITS_RE = r"Opening\s+Unit\s+Balance.+?([\d,.]+)"
-CLOSE_UNITS_RE = r"Closing\s+Unit\s+Balance.+?([\d,.]+)"
-COST_RE = r"Total\s+Cost\s+Value\s*:.+?[INR\s]*([\d,.]+)"
-VALUATION_RE = (
-    r"(?:Valuation|Market\s+Value)\s+on\s+(\d{2}-[A-Za-z]{3}-\d{4})\s*:\s*INR\s*([\d,.]+)"
-)
-NAV_RE = r"NAV\s+on\s+(\d{2}-[A-Za-z]{3}-\d{4})\s*:\s*INR\s*([\d,.]+)"
-
-# Normal Transaction entries
-TRANSACTION_RE1 = rf"{date_re}\t\t([^0-9].*)\t\t{amt_re}\t\t{amt_re}\t\t{amt_re}\t\t{amt_re}"
-# Zero unit transactions (ref: #88)
-TRANSACTION_RE2 = rf"{date_re}\t\t([^0-9].*)\t\t{amt_re}\t\t(?:{amt_re})*\t\t{amt_re}\t\t{amt_re}"
-# Segregated portfolio entries
-TRANSACTION_RE3 = rf"{date_re}\t\t([^0-9].*)\t\t{amt_re}\t\t{amt_re}(?:\t\t{amt_re}\t\t{amt_re})*"
-# Tax transactions
-TRANSACTION_RE4 = rf"{date_re}\t\t([^0-9].*)\t\t{amt_re}(?:\t\t{amt_re}\t\t{amt_re}\t\t{amt_re})*"
-DESCRIPTION_TAIL_RE = r"(\n.+?)(\t\t|$)"
-DIVIDEND_RE = r"(?:div\.|dividend|idcw).+?(reinvest)*.*?@\s*Rs\.\s*([\d\.]+)(?:\s+per\s+unit)?"
-SCHEME_TAIL_RE = r"(\n.+?)(?:\t\t|$)"
-
-
-DEMAT_STATEMENT_PERIOD_RE = (
-    r"for\s+the\s+period\s+from\s+(?P<from>\d{2}-[a-zA-Z0-9]{2,3}-\d{4})"
-    r"\s+to\s+(?P<to>\d{2}-[a-zA-Z0-9]{2,3}-\d{4})"
-)
-DEMAT_HEADER_RE = (
-    r"((?:CDSL|NSDL)\s+demat\s+account)\s+(.+?)\s*DP\s*Id\s*:\s*(.+?)"
-    r"\s*Client\s*Id\s*:\s*(\d+)\s+(\d+)\s+([\d,.]+)"
-)
-DEMAT_MF_HEADER_RE = r"Mutual Fund Folios\s+(\d+)\s+folios\s+(\d+)\s+([\d,.]+)"
-DEMAT_AC_TYPE_RE = r"^(NSDL|CDSL)\s+demat\s+account|Mutual\s+Fund\s+Folios\s+\(F\)"
-DEMAT_MF_TYPE_RE = r"^Mutual\s+Fund\s+Folios\s+\(F\)$"
-DEMAT_AC_HOLDER_RE = r"([^\t\n]+?)\s*\(PAN\s*:\s*(.+?)\)"
-DEMAT_DP_ID_RE = r"DP\s*Id\s*:\s*(.+?)\s*Client\s*Id\s*:\s*(\d+).+PAN"
-NSDL_EQ_RE = (
-    rf"^([A-Z]{{2}}[E|9][0-9A-Z]{{8}}[0-9]{{1}})"
-    rf"\s*(.+?)\s*{amt_re}\s+([\d,.]+)\s+{amt_re}\s+{amt_re}$"
-)
-NSDL_MF_RE = rf"^(INF[0-9A-Z]{{8}}[0-9]{{1}})\s*(.*?)\s*{amt_re}\s+{amt_re}\s+{amt_re}$"
-NSDL_CDSL_HOLDINGS_RE = (
-    r"^([A-Z]{2}[0-9A-Z]{9}[0-9]{1})\s*(.+?)\s+" + rf"{amt_re}\s+" * 10 + rf"{amt_re}$"
-)
-NSDL_MF_HOLDINGS_RE = (
-    rf"({isin_re})[\n\t]+(.+?)[\n\t]+(.+?)[\n\t]+(\d{{4,}}?)[\n\t]+{amt_re}"
-    rf"[\n\t]+{amt_re}[\n\t]+{amt_re}[\n\t]+{amt_re}[\n\t]+{amt_re}[\n\t]+{amt_re}(?:[\n\t]+{amt_re})?$"
-)
diff --git a/casparser/process/utils.py b/casparser/process/utils.py
deleted file mode 100644
index 10a6932..0000000
--- a/casparser/process/utils.py
+++ /dev/null
@@ -1,32 +0,0 @@
-from typing import Optional, Tuple
-
-from casparser_isin import MFISINDb
-
-
-def isin_search(
-    scheme_name: str,
-    rta: str,
-    rta_code: str,
-    isin: Optional[str] = None,
-) -> Tuple[Optional[str], Optional[str], Optional[str]]:
-    """
-    Search isin db for ISIN and AMFI code.
-
-    The underlying ``MFISINDb.isin_lookup`` does ISIN-first lookup
-    internally when ``isin`` is supplied, but only after validating
-    that ``rta`` is one of the known RTAs (CAMS / KARVY / FRANKLIN).
-    The RTA check is deliberate -- if it trips, the parser captured a
-    malformed RTA upstream and the right fix is to repair the parser,
-    not to bypass the validation here.
-
-    :param isin: Scheme ISIN code (from the scheme line, if present).
-    :param scheme_name: Scheme name from CAS.
-    :param rta: RTA for the scheme.
-    :param rta_code: Scheme RTA code.
-    """
-    try:
-        with MFISINDb() as db:
-            scheme_data = db.isin_lookup(scheme_name, rta, rta_code, isin=isin)
-            return scheme_data.isin, scheme_data.amfi_code, scheme_data.type
-    except ValueError:
-        return None, None, None
diff --git a/casparser/types.py b/casparser/types.py
index 3a7d020..92da585 100644
--- a/casparser/types.py
+++ b/casparser/types.py
@@ -87,20 +87,6 @@ class CASData(BaseModel):
     )
 
 
-class PartialCASData(BaseModel):
-    """CAS Parser return data type."""
-
-    investor_info: InvestorInfo
-    file_type: FileType
-    lines: List[str]
-
-
-class ProcessedCASData(BaseModel):
-    cas_type: CASFileType
-    folios: List[Folio]
-    statement_period: StatementPeriod
-
-
 class DematOwner(BaseModel):
     name: str
     PAN: str
@@ -122,6 +108,47 @@ def fix_float(cls, data: dict):
         return data
 
 
+class Bond(BaseModel):
+    """Corporate / government bond holding.
+
+    Two source layouts feed this model — both are present in the same
+    NSDL CAS, one per demat-account flavour:
+
+    - **NSDL-account summary form** (8 data cells):
+      `ISIN | name | frequency | coupon_rate | maturity | num_bonds |
+      face_value | value`. All optional fields populated.
+    - **CDSL-account detailed form** (13 data cells, identical layout to
+      detailed equity rows): we only get `num_bonds`, `market_price`,
+      `value`. `coupon_rate`/`frequency`/`maturity`/`face_value` are
+      `None` here — the detailed table doesn't include them.
+    """
+
+    name: Optional[str] = None
+    isin: str
+    num_bonds: Decimal
+    value: Decimal
+    face_value: Optional[Decimal] = None
+    coupon_rate: Optional[Decimal] = None
+    coupon_frequency: Optional[str] = None
+    maturity_date: Optional[str] = None
+    market_price: Optional[Decimal] = None
+
+    @model_validator(mode="before")
+    @classmethod
+    def fix_float(cls, data: dict):
+        """Strip "," and "_" from string values of required Decimal fields."""
+        for k, v in data.items():
+            try:
+                if issubclass(Decimal, cls.__annotations__[k]) and isinstance(v, str):
+                    data[k] = v.replace(",", "_").replace("_", "")
+            except (KeyError, TypeError):
+                # KeyError: key is not a declared field; leave it to pydantic.
+                # TypeError: Optional[Decimal] / Union annotations; the parser
+                # pre-strips commas, so only required Decimal fields need this.
+                pass
+        return data
+
+
 class MutualFund(BaseModel):
     name: Optional[str] = None
     isin: str
@@ -164,6 +191,7 @@ class DematAccount(BaseModel):
     owners: List[DematOwner]
     equities: List[Equity]
     mutual_funds: List[MutualFund]
+    bonds: List[Bond] = []
 
     @model_validator(mode="before")
     @classmethod
@@ -180,8 +208,8 @@ def fix_float(cls, data: dict):
 class NSDLCASData(BaseModel):
     accounts: List[DematAccount]
     statement_period: StatementPeriod
-    investor_info: Optional[InvestorInfo] = None
-    file_type: Optional[FileType] = None
+    investor_info: InvestorInfo
+    file_type: FileType
     model_config = ConfigDict(
         populate_by_name=True,
         use_enum_values=True,
diff --git a/licenses/AGPL-3.0+.txt b/licenses/AGPL-3.0+.txt
deleted file mode 100644
index a028880..0000000
--- a/licenses/AGPL-3.0+.txt
+++ /dev/null
@@ -1,661 +0,0 @@
-GNU AFFERO GENERAL PUBLIC LICENSE
-                       Version 3, 19 November 2007
-
- Copyright (C) 2007 Free Software Foundation, Inc. <https://fsf.org/>
- Everyone is permitted to copy and distribute verbatim copies
- of this license document, but changing it is not allowed.
-
-                            Preamble
-
-  The GNU Affero General Public License is a free, copyleft license for
-software and other kinds of works, specifically designed to ensure
-cooperation with the community in the case of network server software.
-
-  The licenses for most software and other practical works are designed
-to take away your freedom to share and change the works.  By contrast,
-our General Public Licenses are intended to guarantee your freedom to
-share and change all versions of a program--to make sure it remains free
-software for all its users.
-
-  When we speak of free software, we are referring to freedom, not
-price.  Our General Public Licenses are designed to make sure that you
-have the freedom to distribute copies of free software (and charge for
-them if you wish), that you receive source code or can get it if you
-want it, that you can change the software or use pieces of it in new
-free programs, and that you know you can do these things.
-
-  Developers that use our General Public Licenses protect your rights
-with two steps: (1) assert copyright on the software, and (2) offer
-you this License which gives you legal permission to copy, distribute
-and/or modify the software.
-
-  A secondary benefit of defending all users' freedom is that
-improvements made in alternate versions of the program, if they
-receive widespread use, become available for other developers to
-incorporate.  Many developers of free software are heartened and
-encouraged by the resulting cooperation.  However, in the case of
-software used on network servers, this result may fail to come about.
-The GNU General Public License permits making a modified version and
-letting the public access it on a server without ever releasing its
-source code to the public.
-
-  The GNU Affero General Public License is designed specifically to
-ensure that, in such cases, the modified source code becomes available
-to the community.  It requires the operator of a network server to
-provide the source code of the modified version running there to the
-users of that server.  Therefore, public use of a modified version, on
-a publicly accessible server, gives the public access to the source
-code of the modified version.
-
-  An older license, called the Affero General Public License and
-published by Affero, was designed to accomplish similar goals.  This is
-a different license, not a version of the Affero GPL, but Affero has
-released a new version of the Affero GPL which permits relicensing under
-this license.
-
-  The precise terms and conditions for copying, distribution and
-modification follow.
-
-                       TERMS AND CONDITIONS
-
-  0. Definitions.
-
-  "This License" refers to version 3 of the GNU Affero General Public License.
-
-  "Copyright" also means copyright-like laws that apply to other kinds of
-works, such as semiconductor masks.
-
-  "The Program" refers to any copyrightable work licensed under this
-License.  Each licensee is addressed as "you".  "Licensees" and
-"recipients" may be individuals or organizations.
-
-  To "modify" a work means to copy from or adapt all or part of the work
-in a fashion requiring copyright permission, other than the making of an
-exact copy.  The resulting work is called a "modified version" of the
-earlier work or a work "based on" the earlier work.
-
-  A "covered work" means either the unmodified Program or a work based
-on the Program.
-
-  To "propagate" a work means to do anything with it that, without
-permission, would make you directly or secondarily liable for
-infringement under applicable copyright law, except executing it on a
-computer or modifying a private copy.  Propagation includes copying,
-distribution (with or without modification), making available to the
-public, and in some countries other activities as well.
-
-  To "convey" a work means any kind of propagation that enables other
-parties to make or receive copies.  Mere interaction with a user through
-a computer network, with no transfer of a copy, is not conveying.
-
-  An interactive user interface displays "Appropriate Legal Notices"
-to the extent that it includes a convenient and prominently visible
-feature that (1) displays an appropriate copyright notice, and (2)
-tells the user that there is no warranty for the work (except to the
-extent that warranties are provided), that licensees may convey the
-work under this License, and how to view a copy of this License.  If
-the interface presents a list of user commands or options, such as a
-menu, a prominent item in the list meets this criterion.
-
-  1. Source Code.
-
-  The "source code" for a work means the preferred form of the work
-for making modifications to it.  "Object code" means any non-source
-form of a work.
-
-  A "Standard Interface" means an interface that either is an official
-standard defined by a recognized standards body, or, in the case of
-interfaces specified for a particular programming language, one that
-is widely used among developers working in that language.
-
-  The "System Libraries" of an executable work include anything, other
-than the work as a whole, that (a) is included in the normal form of
-packaging a Major Component, but which is not part of that Major
-Component, and (b) serves only to enable use of the work with that
-Major Component, or to implement a Standard Interface for which an
-implementation is available to the public in source code form.  A
-"Major Component", in this context, means a major essential component
-(kernel, window system, and so on) of the specific operating system
-(if any) on which the executable work runs, or a compiler used to
-produce the work, or an object code interpreter used to run it.
-
-  The "Corresponding Source" for a work in object code form means all
-the source code needed to generate, install, and (for an executable
-work) run the object code and to modify the work, including scripts to
-control those activities.  However, it does not include the work's
-System Libraries, or general-purpose tools or generally available free
-programs which are used unmodified in performing those activities but
-which are not part of the work.  For example, Corresponding Source
-includes interface definition files associated with source files for
-the work, and the source code for shared libraries and dynamically
-linked subprograms that the work is specifically designed to require,
-such as by intimate data communication or control flow between those
-subprograms and other parts of the work.
-
-  The Corresponding Source need not include anything that users
-can regenerate automatically from other parts of the Corresponding
-Source.
-
-  The Corresponding Source for a work in source code form is that
-same work.
-
-  2. Basic Permissions.
-
-  All rights granted under this License are granted for the term of
-copyright on the Program, and are irrevocable provided the stated
-conditions are met.  This License explicitly affirms your unlimited
-permission to run the unmodified Program.  The output from running a
-covered work is covered by this License only if the output, given its
-content, constitutes a covered work.  This License acknowledges your
-rights of fair use or other equivalent, as provided by copyright law.
-
-  You may make, run and propagate covered works that you do not
-convey, without conditions so long as your license otherwise remains
-in force.  You may convey covered works to others for the sole purpose
-of having them make modifications exclusively for you, or provide you
-with facilities for running those works, provided that you comply with
-the terms of this License in conveying all material for which you do
-not control copyright.  Those thus making or running the covered works
-for you must do so exclusively on your behalf, under your direction
-and control, on terms that prohibit them from making any copies of
-your copyrighted material outside their relationship with you.
-
-  Conveying under any other circumstances is permitted solely under
-the conditions stated below.  Sublicensing is not allowed; section 10
-makes it unnecessary.
-
-  3. Protecting Users' Legal Rights From Anti-Circumvention Law.
-
-  No covered work shall be deemed part of an effective technological
-measure under any applicable law fulfilling obligations under article
-11 of the WIPO copyright treaty adopted on 20 December 1996, or
-similar laws prohibiting or restricting circumvention of such
-measures.
-
-  When you convey a covered work, you waive any legal power to forbid
-circumvention of technological measures to the extent such circumvention
-is effected by exercising rights under this License with respect to
-the covered work, and you disclaim any intention to limit operation or
-modification of the work as a means of enforcing, against the work's
-users, your or third parties' legal rights to forbid circumvention of
-technological measures.
-
-  4. Conveying Verbatim Copies.
-
-  You may convey verbatim copies of the Program's source code as you
-receive it, in any medium, provided that you conspicuously and
-appropriately publish on each copy an appropriate copyright notice;
-keep intact all notices stating that this License and any
-non-permissive terms added in accord with section 7 apply to the code;
-keep intact all notices of the absence of any warranty; and give all
-recipients a copy of this License along with the Program.
-
-  You may charge any price or no price for each copy that you convey,
-and you may offer support or warranty protection for a fee.
-
-  5. Conveying Modified Source Versions.
-
-  You may convey a work based on the Program, or the modifications to
-produce it from the Program, in the form of source code under the
-terms of section 4, provided that you also meet all of these conditions:
-
-    a) The work must carry prominent notices stating that you modified
-    it, and giving a relevant date.
-
-    b) The work must carry prominent notices stating that it is
-    released under this License and any conditions added under section
-    7.  This requirement modifies the requirement in section 4 to
-    "keep intact all notices".
-
-    c) You must license the entire work, as a whole, under this
-    License to anyone who comes into possession of a copy.  This
-    License will therefore apply, along with any applicable section 7
-    additional terms, to the whole of the work, and all its parts,
-    regardless of how they are packaged.  This License gives no
-    permission to license the work in any other way, but it does not
-    invalidate such permission if you have separately received it.
-
-    d) If the work has interactive user interfaces, each must display
-    Appropriate Legal Notices; however, if the Program has interactive
-    interfaces that do not display Appropriate Legal Notices, your
-    work need not make them do so.
-
-  A compilation of a covered work with other separate and independent
-works, which are not by their nature extensions of the covered work,
-and which are not combined with it such as to form a larger program,
-in or on a volume of a storage or distribution medium, is called an
-"aggregate" if the compilation and its resulting copyright are not
-used to limit the access or legal rights of the compilation's users
-beyond what the individual works permit.  Inclusion of a covered work
-in an aggregate does not cause this License to apply to the other
-parts of the aggregate.
-
-  6. Conveying Non-Source Forms.
-
-  You may convey a covered work in object code form under the terms
-of sections 4 and 5, provided that you also convey the
-machine-readable Corresponding Source under the terms of this License,
-in one of these ways:
-
-    a) Convey the object code in, or embodied in, a physical product
-    (including a physical distribution medium), accompanied by the
-    Corresponding Source fixed on a durable physical medium
-    customarily used for software interchange.
-
-    b) Convey the object code in, or embodied in, a physical product
-    (including a physical distribution medium), accompanied by a
-    written offer, valid for at least three years and valid for as
-    long as you offer spare parts or customer support for that product
-    model, to give anyone who possesses the object code either (1) a
-    copy of the Corresponding Source for all the software in the
-    product that is covered by this License, on a durable physical
-    medium customarily used for software interchange, for a price no
-    more than your reasonable cost of physically performing this
-    conveying of source, or (2) access to copy the
-    Corresponding Source from a network server at no charge.
-
-    c) Convey individual copies of the object code with a copy of the
-    written offer to provide the Corresponding Source.  This
-    alternative is allowed only occasionally and noncommercially, and
-    only if you received the object code with such an offer, in accord
-    with subsection 6b.
-
-    d) Convey the object code by offering access from a designated
-    place (gratis or for a charge), and offer equivalent access to the
-    Corresponding Source in the same way through the same place at no
-    further charge.  You need not require recipients to copy the
-    Corresponding Source along with the object code.  If the place to
-    copy the object code is a network server, the Corresponding Source
-    may be on a different server (operated by you or a third party)
-    that supports equivalent copying facilities, provided you maintain
-    clear directions next to the object code saying where to find the
-    Corresponding Source.  Regardless of what server hosts the
-    Corresponding Source, you remain obligated to ensure that it is
-    available for as long as needed to satisfy these requirements.
-
-    e) Convey the object code using peer-to-peer transmission, provided
-    you inform other peers where the object code and Corresponding
-    Source of the work are being offered to the general public at no
-    charge under subsection 6d.
-
-  A separable portion of the object code, whose source code is excluded
-from the Corresponding Source as a System Library, need not be
-included in conveying the object code work.
-
-  A "User Product" is either (1) a "consumer product", which means any
-tangible personal property which is normally used for personal, family,
-or household purposes, or (2) anything designed or sold for incorporation
-into a dwelling.  In determining whether a product is a consumer product,
-doubtful cases shall be resolved in favor of coverage.  For a particular
-product received by a particular user, "normally used" refers to a
-typical or common use of that class of product, regardless of the status
-of the particular user or of the way in which the particular user
-actually uses, or expects or is expected to use, the product.  A product
-is a consumer product regardless of whether the product has substantial
-commercial, industrial or non-consumer uses, unless such uses represent
-the only significant mode of use of the product.
-
-  "Installation Information" for a User Product means any methods,
-procedures, authorization keys, or other information required to install
-and execute modified versions of a covered work in that User Product from
-a modified version of its Corresponding Source.  The information must
-suffice to ensure that the continued functioning of the modified object
-code is in no case prevented or interfered with solely because
-modification has been made.
-
-  If you convey an object code work under this section in, or with, or
-specifically for use in, a User Product, and the conveying occurs as
-part of a transaction in which the right of possession and use of the
-User Product is transferred to the recipient in perpetuity or for a
-fixed term (regardless of how the transaction is characterized), the
-Corresponding Source conveyed under this section must be accompanied
-by the Installation Information.  But this requirement does not apply
-if neither you nor any third party retains the ability to install
-modified object code on the User Product (for example, the work has
-been installed in ROM).
-
-  The requirement to provide Installation Information does not include a
-requirement to continue to provide support service, warranty, or updates
-for a work that has been modified or installed by the recipient, or for
-the User Product in which it has been modified or installed.  Access to a
-network may be denied when the modification itself materially and
-adversely affects the operation of the network or violates the rules and
-protocols for communication across the network.
-
-  Corresponding Source conveyed, and Installation Information provided,
-in accord with this section must be in a format that is publicly
-documented (and with an implementation available to the public in
-source code form), and must require no special password or key for
-unpacking, reading or copying.
-
-  7. Additional Terms.
-
-  "Additional permissions" are terms that supplement the terms of this
-License by making exceptions from one or more of its conditions.
-Additional permissions that are applicable to the entire Program shall
-be treated as though they were included in this License, to the extent
-that they are valid under applicable law.  If additional permissions
-apply only to part of the Program, that part may be used separately
-under those permissions, but the entire Program remains governed by
-this License without regard to the additional permissions.
-
-  When you convey a copy of a covered work, you may at your option
-remove any additional permissions from that copy, or from any part of
-it.  (Additional permissions may be written to require their own
-removal in certain cases when you modify the work.)  You may place
-additional permissions on material, added by you to a covered work,
-for which you have or can give appropriate copyright permission.
-
-  Notwithstanding any other provision of this License, for material you
-add to a covered work, you may (if authorized by the copyright holders of
-that material) supplement the terms of this License with terms:
-
-    a) Disclaiming warranty or limiting liability differently from the
-    terms of sections 15 and 16 of this License; or
-
-    b) Requiring preservation of specified reasonable legal notices or
-    author attributions in that material or in the Appropriate Legal
-    Notices displayed by works containing it; or
-
-    c) Prohibiting misrepresentation of the origin of that material, or
-    requiring that modified versions of such material be marked in
-    reasonable ways as different from the original version; or
-
-    d) Limiting the use for publicity purposes of names of licensors or
-    authors of the material; or
-
-    e) Declining to grant rights under trademark law for use of some
-    trade names, trademarks, or service marks; or
-
-    f) Requiring indemnification of licensors and authors of that
-    material by anyone who conveys the material (or modified versions of
-    it) with contractual assumptions of liability to the recipient, for
-    any liability that these contractual assumptions directly impose on
-    those licensors and authors.
-
-  All other non-permissive additional terms are considered "further
-restrictions" within the meaning of section 10.  If the Program as you
-received it, or any part of it, contains a notice stating that it is
-governed by this License along with a term that is a further
-restriction, you may remove that term.  If a license document contains
-a further restriction but permits relicensing or conveying under this
-License, you may add to a covered work material governed by the terms
-of that license document, provided that the further restriction does
-not survive such relicensing or conveying.
-
-  If you add terms to a covered work in accord with this section, you
-must place, in the relevant source files, a statement of the
-additional terms that apply to those files, or a notice indicating
-where to find the applicable terms.
-
-  Additional terms, permissive or non-permissive, may be stated in the
-form of a separately written license, or stated as exceptions;
-the above requirements apply either way.
-
-  8. Termination.
-
-  You may not propagate or modify a covered work except as expressly
-provided under this License.  Any attempt otherwise to propagate or
-modify it is void, and will automatically terminate your rights under
-this License (including any patent licenses granted under the third
-paragraph of section 11).
-
-  However, if you cease all violation of this License, then your
-license from a particular copyright holder is reinstated (a)
-provisionally, unless and until the copyright holder explicitly and
-finally terminates your license, and (b) permanently, if the copyright
-holder fails to notify you of the violation by some reasonable means
-prior to 60 days after the cessation.
-
-  Moreover, your license from a particular copyright holder is
-reinstated permanently if the copyright holder notifies you of the
-violation by some reasonable means, this is the first time you have
-received notice of violation of this License (for any work) from that
-copyright holder, and you cure the violation prior to 30 days after
-your receipt of the notice.
-
-  Termination of your rights under this section does not terminate the
-licenses of parties who have received copies or rights from you under
-this License.  If your rights have been terminated and not permanently
-reinstated, you do not qualify to receive new licenses for the same
-material under section 10.
-
-  9. Acceptance Not Required for Having Copies.
-
-  You are not required to accept this License in order to receive or
-run a copy of the Program.  Ancillary propagation of a covered work
-occurring solely as a consequence of using peer-to-peer transmission
-to receive a copy likewise does not require acceptance.  However,
-nothing other than this License grants you permission to propagate or
-modify any covered work.  These actions infringe copyright if you do
-not accept this License.  Therefore, by modifying or propagating a
-covered work, you indicate your acceptance of this License to do so.
-
-  10. Automatic Licensing of Downstream Recipients.
-
-  Each time you convey a covered work, the recipient automatically
-receives a license from the original licensors, to run, modify and
-propagate that work, subject to this License.  You are not responsible
-for enforcing compliance by third parties with this License.
-
-  An "entity transaction" is a transaction transferring control of an
-organization, or substantially all assets of one, or subdividing an
-organization, or merging organizations.  If propagation of a covered
-work results from an entity transaction, each party to that
-transaction who receives a copy of the work also receives whatever
-licenses to the work the party's predecessor in interest had or could
-give under the previous paragraph, plus a right to possession of the
-Corresponding Source of the work from the predecessor in interest, if
-the predecessor has it or can get it with reasonable efforts.
-
-  You may not impose any further restrictions on the exercise of the
-rights granted or affirmed under this License.  For example, you may
-not impose a license fee, royalty, or other charge for exercise of
-rights granted under this License, and you may not initiate litigation
-(including a cross-claim or counterclaim in a lawsuit) alleging that
-any patent claim is infringed by making, using, selling, offering for
-sale, or importing the Program or any portion of it.
-
-  11. Patents.
-
-  A "contributor" is a copyright holder who authorizes use under this
-License of the Program or a work on which the Program is based.  The
-work thus licensed is called the contributor's "contributor version".
-
-  A contributor's "essential patent claims" are all patent claims
-owned or controlled by the contributor, whether already acquired or
-hereafter acquired, that would be infringed by some manner, permitted
-by this License, of making, using, or selling its contributor version,
-but do not include claims that would be infringed only as a
-consequence of further modification of the contributor version.  For
-purposes of this definition, "control" includes the right to grant
-patent sublicenses in a manner consistent with the requirements of
-this License.
-
-  Each contributor grants you a non-exclusive, worldwide, royalty-free
-patent license under the contributor's essential patent claims, to
-make, use, sell, offer for sale, import and otherwise run, modify and
-propagate the contents of its contributor version.
-
-  In the following three paragraphs, a "patent license" is any express
-agreement or commitment, however denominated, not to enforce a patent
-(such as an express permission to practice a patent or covenant not to
-sue for patent infringement).  To "grant" such a patent license to a
-party means to make such an agreement or commitment not to enforce a
-patent against the party.
-
-  If you convey a covered work, knowingly relying on a patent license,
-and the Corresponding Source of the work is not available for anyone
-to copy, free of charge and under the terms of this License, through a
-publicly available network server or other readily accessible means,
-then you must either (1) cause the Corresponding Source to be so
-available, or (2) arrange to deprive yourself of the benefit of the
-patent license for this particular work, or (3) arrange, in a manner
-consistent with the requirements of this License, to extend the patent
-license to downstream recipients.  "Knowingly relying" means you have
-actual knowledge that, but for the patent license, your conveying the
-covered work in a country, or your recipient's use of the covered work
-in a country, would infringe one or more identifiable patents in that
-country that you have reason to believe are valid.
-
-  If, pursuant to or in connection with a single transaction or
-arrangement, you convey, or propagate by procuring conveyance of, a
-covered work, and grant a patent license to some of the parties
-receiving the covered work authorizing them to use, propagate, modify
-or convey a specific copy of the covered work, then the patent license
-you grant is automatically extended to all recipients of the covered
-work and works based on it.
-
-  A patent license is "discriminatory" if it does not include within
-the scope of its coverage, prohibits the exercise of, or is
-conditioned on the non-exercise of one or more of the rights that are
-specifically granted under this License.  You may not convey a covered
-work if you are a party to an arrangement with a third party that is
-in the business of distributing software, under which you make payment
-to the third party based on the extent of your activity of conveying
-the work, and under which the third party grants, to any of the
-parties who would receive the covered work from you, a discriminatory
-patent license (a) in connection with copies of the covered work
-conveyed by you (or copies made from those copies), or (b) primarily
-for and in connection with specific products or compilations that
-contain the covered work, unless you entered into that arrangement,
-or that patent license was granted, prior to 28 March 2007.
-
-  Nothing in this License shall be construed as excluding or limiting
-any implied license or other defenses to infringement that may
-otherwise be available to you under applicable patent law.
-
-  12. No Surrender of Others' Freedom.
-
-  If conditions are imposed on you (whether by court order, agreement or
-otherwise) that contradict the conditions of this License, they do not
-excuse you from the conditions of this License.  If you cannot convey a
-covered work so as to satisfy simultaneously your obligations under this
-License and any other pertinent obligations, then as a consequence you may
-not convey it at all.  For example, if you agree to terms that obligate you
-to collect a royalty for further conveying from those to whom you convey
-the Program, the only way you could satisfy both those terms and this
-License would be to refrain entirely from conveying the Program.
-
-  13. Remote Network Interaction; Use with the GNU General Public License.
-
-  Notwithstanding any other provision of this License, if you modify the
-Program, your modified version must prominently offer all users
-interacting with it remotely through a computer network (if your version
-supports such interaction) an opportunity to receive the Corresponding
-Source of your version by providing access to the Corresponding Source
-from a network server at no charge, through some standard or customary
-means of facilitating copying of software.  This Corresponding Source
-shall include the Corresponding Source for any work covered by version 3
-of the GNU General Public License that is incorporated pursuant to the
-following paragraph.
-
-  Notwithstanding any other provision of this License, you have
-permission to link or combine any covered work with a work licensed
-under version 3 of the GNU General Public License into a single
-combined work, and to convey the resulting work.  The terms of this
-License will continue to apply to the part which is the covered work,
-but the work with which it is combined will remain governed by version
-3 of the GNU General Public License.
-
-  14. Revised Versions of this License.
-
-  The Free Software Foundation may publish revised and/or new versions of
-the GNU Affero General Public License from time to time.  Such new versions
-will be similar in spirit to the present version, but may differ in detail to
-address new problems or concerns.
-
-  Each version is given a distinguishing version number.  If the
-Program specifies that a certain numbered version of the GNU Affero General
-Public License "or any later version" applies to it, you have the
-option of following the terms and conditions either of that numbered
-version or of any later version published by the Free Software
-Foundation.  If the Program does not specify a version number of the
-GNU Affero General Public License, you may choose any version ever published
-by the Free Software Foundation.
-
-  If the Program specifies that a proxy can decide which future
-versions of the GNU Affero General Public License can be used, that proxy's
-public statement of acceptance of a version permanently authorizes you
-to choose that version for the Program.
-
-  Later license versions may give you additional or different
-permissions.  However, no additional obligations are imposed on any
-author or copyright holder as a result of your choosing to follow a
-later version.
-
-  15. Disclaimer of Warranty.
-
-  THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY
-APPLICABLE LAW.  EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT
-HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY
-OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO,
-THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
-PURPOSE.  THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM
-IS WITH YOU.  SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF
-ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
-
-  16. Limitation of Liability.
-
-  IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
-WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS
-THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY
-GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE
-USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF
-DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD
-PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS),
-EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF
-SUCH DAMAGES.
-
-  17. Interpretation of Sections 15 and 16.
-
-  If the disclaimer of warranty and limitation of liability provided
-above cannot be given local legal effect according to their terms,
-reviewing courts shall apply local law that most closely approximates
-an absolute waiver of all civil liability in connection with the
-Program, unless a warranty or assumption of liability accompanies a
-copy of the Program in return for a fee.
-
-                     END OF TERMS AND CONDITIONS
-
-            How to Apply These Terms to Your New Programs
-
-  If you develop a new program, and you want it to be of the greatest
-possible use to the public, the best way to achieve this is to make it
-free software which everyone can redistribute and change under these terms.
-
-  To do so, attach the following notices to the program.  It is safest
-to attach them to the start of each source file to most effectively
-state the exclusion of warranty; and each file should have at least
-the "copyright" line and a pointer to where the full notice is found.
-
-    <one line to give the program's name and a brief idea of what it does.>
-    Copyright (C) <year>  <name of author>
-
-    This program is free software: you can redistribute it and/or modify
-    it under the terms of the GNU Affero General Public License as published by
-    the Free Software Foundation, either version 3 of the License, or
-    (at your option) any later version.
-
-    This program is distributed in the hope that it will be useful,
-    but WITHOUT ANY WARRANTY; without even the implied warranty of
-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-    GNU Affero General Public License for more details.
-
-    You should have received a copy of the GNU Affero General Public License
-    along with this program.  If not, see <https://www.gnu.org/licenses/>.
-
-Also add information on how to contact you by electronic and paper mail.
-
-  If your software can interact with users remotely through a computer
-network, you should also make sure that it provides a way for users to
-get its source.  For example, if your program is a web application, its
-interface could display a "Source" link that leads users to an archive
-of the code.  There are many ways you could offer source, and different
-solutions will be better for different programs; see section 13 for the
-specific requirements.
-
-  You should also get your employer (if you work as a programmer) or school,
-if any, to sign a "copyright disclaimer" for the program, if necessary.
-For more information on this, and how to apply and follow the GNU AGPL, see
-<https://www.gnu.org/licenses/>.
diff --git a/licenses/GPL-3.0+.txt b/licenses/GPL-3.0+.txt
deleted file mode 100644
index 92b370f..0000000
--- a/licenses/GPL-3.0+.txt
+++ /dev/null
@@ -1,674 +0,0 @@
-GNU GENERAL PUBLIC LICENSE
-                       Version 3, 29 June 2007
-
- Copyright (C) 2007 Free Software Foundation, Inc. <http://fsf.org/>
- Everyone is permitted to copy and distribute verbatim copies
- of this license document, but changing it is not allowed.
-
-                            Preamble
-
-  The GNU General Public License is a free, copyleft license for
-software and other kinds of works.
-
-  The licenses for most software and other practical works are designed
-to take away your freedom to share and change the works.  By contrast,
-the GNU General Public License is intended to guarantee your freedom to
-share and change all versions of a program--to make sure it remains free
-software for all its users.  We, the Free Software Foundation, use the
-GNU General Public License for most of our software; it applies also to
-any other work released this way by its authors.  You can apply it to
-your programs, too.
-
-  When we speak of free software, we are referring to freedom, not
-price.  Our General Public Licenses are designed to make sure that you
-have the freedom to distribute copies of free software (and charge for
-them if you wish), that you receive source code or can get it if you
-want it, that you can change the software or use pieces of it in new
-free programs, and that you know you can do these things.
-
-  To protect your rights, we need to prevent others from denying you
-these rights or asking you to surrender the rights.  Therefore, you have
-certain responsibilities if you distribute copies of the software, or if
-you modify it: responsibilities to respect the freedom of others.
-
-  For example, if you distribute copies of such a program, whether
-gratis or for a fee, you must pass on to the recipients the same
-freedoms that you received.  You must make sure that they, too, receive
-or can get the source code.  And you must show them these terms so they
-know their rights.
-
-  Developers that use the GNU GPL protect your rights with two steps:
-(1) assert copyright on the software, and (2) offer you this License
-giving you legal permission to copy, distribute and/or modify it.
-
-  For the developers' and authors' protection, the GPL clearly explains
-that there is no warranty for this free software.  For both users' and
-authors' sake, the GPL requires that modified versions be marked as
-changed, so that their problems will not be attributed erroneously to
-authors of previous versions.
-
-  Some devices are designed to deny users access to install or run
-modified versions of the software inside them, although the manufacturer
-can do so.  This is fundamentally incompatible with the aim of
-protecting users' freedom to change the software.  The systematic
-pattern of such abuse occurs in the area of products for individuals to
-use, which is precisely where it is most unacceptable.  Therefore, we
-have designed this version of the GPL to prohibit the practice for those
-products.  If such problems arise substantially in other domains, we
-stand ready to extend this provision to those domains in future versions
-of the GPL, as needed to protect the freedom of users.
-
-  Finally, every program is threatened constantly by software patents.
-States should not allow patents to restrict development and use of
-software on general-purpose computers, but in those that do, we wish to
-avoid the special danger that patents applied to a free program could
-make it effectively proprietary.  To prevent this, the GPL assures that
-patents cannot be used to render the program non-free.
-
-  The precise terms and conditions for copying, distribution and
-modification follow.
-
-                       TERMS AND CONDITIONS
-
-  0. Definitions.
-
-  "This License" refers to version 3 of the GNU General Public License.
-
-  "Copyright" also means copyright-like laws that apply to other kinds of
-works, such as semiconductor masks.
-
-  "The Program" refers to any copyrightable work licensed under this
-License.  Each licensee is addressed as "you".  "Licensees" and
-"recipients" may be individuals or organizations.
-
-  To "modify" a work means to copy from or adapt all or part of the work
-in a fashion requiring copyright permission, other than the making of an
-exact copy.  The resulting work is called a "modified version" of the
-earlier work or a work "based on" the earlier work.
-
-  A "covered work" means either the unmodified Program or a work based
-on the Program.
-
-  To "propagate" a work means to do anything with it that, without
-permission, would make you directly or secondarily liable for
-infringement under applicable copyright law, except executing it on a
-computer or modifying a private copy.  Propagation includes copying,
-distribution (with or without modification), making available to the
-public, and in some countries other activities as well.
-
-  To "convey" a work means any kind of propagation that enables other
-parties to make or receive copies.  Mere interaction with a user through
-a computer network, with no transfer of a copy, is not conveying.
-
-  An interactive user interface displays "Appropriate Legal Notices"
-to the extent that it includes a convenient and prominently visible
-feature that (1) displays an appropriate copyright notice, and (2)
-tells the user that there is no warranty for the work (except to the
-extent that warranties are provided), that licensees may convey the
-work under this License, and how to view a copy of this License.  If
-the interface presents a list of user commands or options, such as a
-menu, a prominent item in the list meets this criterion.
-
-  1. Source Code.
-
-  The "source code" for a work means the preferred form of the work
-for making modifications to it.  "Object code" means any non-source
-form of a work.
-
-  A "Standard Interface" means an interface that either is an official
-standard defined by a recognized standards body, or, in the case of
-interfaces specified for a particular programming language, one that
-is widely used among developers working in that language.
-
-  The "System Libraries" of an executable work include anything, other
-than the work as a whole, that (a) is included in the normal form of
-packaging a Major Component, but which is not part of that Major
-Component, and (b) serves only to enable use of the work with that
-Major Component, or to implement a Standard Interface for which an
-implementation is available to the public in source code form.  A
-"Major Component", in this context, means a major essential component
-(kernel, window system, and so on) of the specific operating system
-(if any) on which the executable work runs, or a compiler used to
-produce the work, or an object code interpreter used to run it.
-
-  The "Corresponding Source" for a work in object code form means all
-the source code needed to generate, install, and (for an executable
-work) run the object code and to modify the work, including scripts to
-control those activities.  However, it does not include the work's
-System Libraries, or general-purpose tools or generally available free
-programs which are used unmodified in performing those activities but
-which are not part of the work.  For example, Corresponding Source
-includes interface definition files associated with source files for
-the work, and the source code for shared libraries and dynamically
-linked subprograms that the work is specifically designed to require,
-such as by intimate data communication or control flow between those
-subprograms and other parts of the work.
-
-  The Corresponding Source need not include anything that users
-can regenerate automatically from other parts of the Corresponding
-Source.
-
-  The Corresponding Source for a work in source code form is that
-same work.
-
-  2. Basic Permissions.
-
-  All rights granted under this License are granted for the term of
-copyright on the Program, and are irrevocable provided the stated
-conditions are met.  This License explicitly affirms your unlimited
-permission to run the unmodified Program.  The output from running a
-covered work is covered by this License only if the output, given its
-content, constitutes a covered work.  This License acknowledges your
-rights of fair use or other equivalent, as provided by copyright law.
-
-  You may make, run and propagate covered works that you do not
-convey, without conditions so long as your license otherwise remains
-in force.  You may convey covered works to others for the sole purpose
-of having them make modifications exclusively for you, or provide you
-with facilities for running those works, provided that you comply with
-the terms of this License in conveying all material for which you do
-not control copyright.  Those thus making or running the covered works
-for you must do so exclusively on your behalf, under your direction
-and control, on terms that prohibit them from making any copies of
-your copyrighted material outside their relationship with you.
-
-  Conveying under any other circumstances is permitted solely under
-the conditions stated below.  Sublicensing is not allowed; section 10
-makes it unnecessary.
-
-  3. Protecting Users' Legal Rights From Anti-Circumvention Law.
-
-  No covered work shall be deemed part of an effective technological
-measure under any applicable law fulfilling obligations under article
-11 of the WIPO copyright treaty adopted on 20 December 1996, or
-similar laws prohibiting or restricting circumvention of such
-measures.
-
-  When you convey a covered work, you waive any legal power to forbid
-circumvention of technological measures to the extent such circumvention
-is effected by exercising rights under this License with respect to
-the covered work, and you disclaim any intention to limit operation or
-modification of the work as a means of enforcing, against the work's
-users, your or third parties' legal rights to forbid circumvention of
-technological measures.
-
-  4. Conveying Verbatim Copies.
-
-  You may convey verbatim copies of the Program's source code as you
-receive it, in any medium, provided that you conspicuously and
-appropriately publish on each copy an appropriate copyright notice;
-keep intact all notices stating that this License and any
-non-permissive terms added in accord with section 7 apply to the code;
-keep intact all notices of the absence of any warranty; and give all
-recipients a copy of this License along with the Program.
-
-  You may charge any price or no price for each copy that you convey,
-and you may offer support or warranty protection for a fee.
-
-  5. Conveying Modified Source Versions.
-
-  You may convey a work based on the Program, or the modifications to
-produce it from the Program, in the form of source code under the
-terms of section 4, provided that you also meet all of these conditions:
-
-    a) The work must carry prominent notices stating that you modified
-    it, and giving a relevant date.
-
-    b) The work must carry prominent notices stating that it is
-    released under this License and any conditions added under section
-    7.  This requirement modifies the requirement in section 4 to
-    "keep intact all notices".
-
-    c) You must license the entire work, as a whole, under this
-    License to anyone who comes into possession of a copy.  This
-    License will therefore apply, along with any applicable section 7
-    additional terms, to the whole of the work, and all its parts,
-    regardless of how they are packaged.  This License gives no
-    permission to license the work in any other way, but it does not
-    invalidate such permission if you have separately received it.
-
-    d) If the work has interactive user interfaces, each must display
-    Appropriate Legal Notices; however, if the Program has interactive
-    interfaces that do not display Appropriate Legal Notices, your
-    work need not make them do so.
-
-  A compilation of a covered work with other separate and independent
-works, which are not by their nature extensions of the covered work,
-and which are not combined with it such as to form a larger program,
-in or on a volume of a storage or distribution medium, is called an
-"aggregate" if the compilation and its resulting copyright are not
-used to limit the access or legal rights of the compilation's users
-beyond what the individual works permit.  Inclusion of a covered work
-in an aggregate does not cause this License to apply to the other
-parts of the aggregate.
-
-  6. Conveying Non-Source Forms.
-
-  You may convey a covered work in object code form under the terms
-of sections 4 and 5, provided that you also convey the
-machine-readable Corresponding Source under the terms of this License,
-in one of these ways:
-
-    a) Convey the object code in, or embodied in, a physical product
-    (including a physical distribution medium), accompanied by the
-    Corresponding Source fixed on a durable physical medium
-    customarily used for software interchange.
-
-    b) Convey the object code in, or embodied in, a physical product
-    (including a physical distribution medium), accompanied by a
-    written offer, valid for at least three years and valid for as
-    long as you offer spare parts or customer support for that product
-    model, to give anyone who possesses the object code either (1) a
-    copy of the Corresponding Source for all the software in the
-    product that is covered by this License, on a durable physical
-    medium customarily used for software interchange, for a price no
-    more than your reasonable cost of physically performing this
-    conveying of source, or (2) access to copy the
-    Corresponding Source from a network server at no charge.
-
-    c) Convey individual copies of the object code with a copy of the
-    written offer to provide the Corresponding Source.  This
-    alternative is allowed only occasionally and noncommercially, and
-    only if you received the object code with such an offer, in accord
-    with subsection 6b.
-
-    d) Convey the object code by offering access from a designated
-    place (gratis or for a charge), and offer equivalent access to the
-    Corresponding Source in the same way through the same place at no
-    further charge.  You need not require recipients to copy the
-    Corresponding Source along with the object code.  If the place to
-    copy the object code is a network server, the Corresponding Source
-    may be on a different server (operated by you or a third party)
-    that supports equivalent copying facilities, provided you maintain
-    clear directions next to the object code saying where to find the
-    Corresponding Source.  Regardless of what server hosts the
-    Corresponding Source, you remain obligated to ensure that it is
-    available for as long as needed to satisfy these requirements.
-
-    e) Convey the object code using peer-to-peer transmission, provided
-    you inform other peers where the object code and Corresponding
-    Source of the work are being offered to the general public at no
-    charge under subsection 6d.
-
-  A separable portion of the object code, whose source code is excluded
-from the Corresponding Source as a System Library, need not be
-included in conveying the object code work.
-
-  A "User Product" is either (1) a "consumer product", which means any
-tangible personal property which is normally used for personal, family,
-or household purposes, or (2) anything designed or sold for incorporation
-into a dwelling.  In determining whether a product is a consumer product,
-doubtful cases shall be resolved in favor of coverage.  For a particular
-product received by a particular user, "normally used" refers to a
-typical or common use of that class of product, regardless of the status
-of the particular user or of the way in which the particular user
-actually uses, or expects or is expected to use, the product.  A product
-is a consumer product regardless of whether the product has substantial
-commercial, industrial or non-consumer uses, unless such uses represent
-the only significant mode of use of the product.
-
-  "Installation Information" for a User Product means any methods,
-procedures, authorization keys, or other information required to install
-and execute modified versions of a covered work in that User Product from
-a modified version of its Corresponding Source.  The information must
-suffice to ensure that the continued functioning of the modified object
-code is in no case prevented or interfered with solely because
-modification has been made.
-
-  If you convey an object code work under this section in, or with, or
-specifically for use in, a User Product, and the conveying occurs as
-part of a transaction in which the right of possession and use of the
-User Product is transferred to the recipient in perpetuity or for a
-fixed term (regardless of how the transaction is characterized), the
-Corresponding Source conveyed under this section must be accompanied
-by the Installation Information.  But this requirement does not apply
-if neither you nor any third party retains the ability to install
-modified object code on the User Product (for example, the work has
-been installed in ROM).
-
-  The requirement to provide Installation Information does not include a
-requirement to continue to provide support service, warranty, or updates
-for a work that has been modified or installed by the recipient, or for
-the User Product in which it has been modified or installed.  Access to a
-network may be denied when the modification itself materially and
-adversely affects the operation of the network or violates the rules and
-protocols for communication across the network.
-
-  Corresponding Source conveyed, and Installation Information provided,
-in accord with this section must be in a format that is publicly
-documented (and with an implementation available to the public in
-source code form), and must require no special password or key for
-unpacking, reading or copying.
-
-  7. Additional Terms.
-
-  "Additional permissions" are terms that supplement the terms of this
-License by making exceptions from one or more of its conditions.
-Additional permissions that are applicable to the entire Program shall
-be treated as though they were included in this License, to the extent
-that they are valid under applicable law.  If additional permissions
-apply only to part of the Program, that part may be used separately
-under those permissions, but the entire Program remains governed by
-this License without regard to the additional permissions.
-
-  When you convey a copy of a covered work, you may at your option
-remove any additional permissions from that copy, or from any part of
-it.  (Additional permissions may be written to require their own
-removal in certain cases when you modify the work.)  You may place
-additional permissions on material, added by you to a covered work,
-for which you have or can give appropriate copyright permission.
-
-  Notwithstanding any other provision of this License, for material you
-add to a covered work, you may (if authorized by the copyright holders of
-that material) supplement the terms of this License with terms:
-
-    a) Disclaiming warranty or limiting liability differently from the
-    terms of sections 15 and 16 of this License; or
-
-    b) Requiring preservation of specified reasonable legal notices or
-    author attributions in that material or in the Appropriate Legal
-    Notices displayed by works containing it; or
-
-    c) Prohibiting misrepresentation of the origin of that material, or
-    requiring that modified versions of such material be marked in
-    reasonable ways as different from the original version; or
-
-    d) Limiting the use for publicity purposes of names of licensors or
-    authors of the material; or
-
-    e) Declining to grant rights under trademark law for use of some
-    trade names, trademarks, or service marks; or
-
-    f) Requiring indemnification of licensors and authors of that
-    material by anyone who conveys the material (or modified versions of
-    it) with contractual assumptions of liability to the recipient, for
-    any liability that these contractual assumptions directly impose on
-    those licensors and authors.
-
-  All other non-permissive additional terms are considered "further
-restrictions" within the meaning of section 10.  If the Program as you
-received it, or any part of it, contains a notice stating that it is
-governed by this License along with a term that is a further
-restriction, you may remove that term.  If a license document contains
-a further restriction but permits relicensing or conveying under this
-License, you may add to a covered work material governed by the terms
-of that license document, provided that the further restriction does
-not survive such relicensing or conveying.
-
-  If you add terms to a covered work in accord with this section, you
-must place, in the relevant source files, a statement of the
-additional terms that apply to those files, or a notice indicating
-where to find the applicable terms.
-
-  Additional terms, permissive or non-permissive, may be stated in the
-form of a separately written license, or stated as exceptions;
-the above requirements apply either way.
-
-  8. Termination.
-
-  You may not propagate or modify a covered work except as expressly
-provided under this License.  Any attempt otherwise to propagate or
-modify it is void, and will automatically terminate your rights under
-this License (including any patent licenses granted under the third
-paragraph of section 11).
-
-  However, if you cease all violation of this License, then your
-license from a particular copyright holder is reinstated (a)
-provisionally, unless and until the copyright holder explicitly and
-finally terminates your license, and (b) permanently, if the copyright
-holder fails to notify you of the violation by some reasonable means
-prior to 60 days after the cessation.
-
-  Moreover, your license from a particular copyright holder is
-reinstated permanently if the copyright holder notifies you of the
-violation by some reasonable means, this is the first time you have
-received notice of violation of this License (for any work) from that
-copyright holder, and you cure the violation prior to 30 days after
-your receipt of the notice.
-
-  Termination of your rights under this section does not terminate the
-licenses of parties who have received copies or rights from you under
-this License.  If your rights have been terminated and not permanently
-reinstated, you do not qualify to receive new licenses for the same
-material under section 10.
-
-  9. Acceptance Not Required for Having Copies.
-
-  You are not required to accept this License in order to receive or
-run a copy of the Program.  Ancillary propagation of a covered work
-occurring solely as a consequence of using peer-to-peer transmission
-to receive a copy likewise does not require acceptance.  However,
-nothing other than this License grants you permission to propagate or
-modify any covered work.  These actions infringe copyright if you do
-not accept this License.  Therefore, by modifying or propagating a
-covered work, you indicate your acceptance of this License to do so.
-
-  10. Automatic Licensing of Downstream Recipients.
-
-  Each time you convey a covered work, the recipient automatically
-receives a license from the original licensors, to run, modify and
-propagate that work, subject to this License.  You are not responsible
-for enforcing compliance by third parties with this License.
-
-  An "entity transaction" is a transaction transferring control of an
-organization, or substantially all assets of one, or subdividing an
-organization, or merging organizations.  If propagation of a covered
-work results from an entity transaction, each party to that
-transaction who receives a copy of the work also receives whatever
-licenses to the work the party's predecessor in interest had or could
-give under the previous paragraph, plus a right to possession of the
-Corresponding Source of the work from the predecessor in interest, if
-the predecessor has it or can get it with reasonable efforts.
-
-  You may not impose any further restrictions on the exercise of the
-rights granted or affirmed under this License.  For example, you may
-not impose a license fee, royalty, or other charge for exercise of
-rights granted under this License, and you may not initiate litigation
-(including a cross-claim or counterclaim in a lawsuit) alleging that
-any patent claim is infringed by making, using, selling, offering for
-sale, or importing the Program or any portion of it.
-
-  11. Patents.
-
-  A "contributor" is a copyright holder who authorizes use under this
-License of the Program or a work on which the Program is based.  The
-work thus licensed is called the contributor's "contributor version".
-
-  A contributor's "essential patent claims" are all patent claims
-owned or controlled by the contributor, whether already acquired or
-hereafter acquired, that would be infringed by some manner, permitted
-by this License, of making, using, or selling its contributor version,
-but do not include claims that would be infringed only as a
-consequence of further modification of the contributor version.  For
-purposes of this definition, "control" includes the right to grant
-patent sublicenses in a manner consistent with the requirements of
-this License.
-
-  Each contributor grants you a non-exclusive, worldwide, royalty-free
-patent license under the contributor's essential patent claims, to
-make, use, sell, offer for sale, import and otherwise run, modify and
-propagate the contents of its contributor version.
-
-  In the following three paragraphs, a "patent license" is any express
-agreement or commitment, however denominated, not to enforce a patent
-(such as an express permission to practice a patent or covenant not to
-sue for patent infringement).  To "grant" such a patent license to a
-party means to make such an agreement or commitment not to enforce a
-patent against the party.
-
-  If you convey a covered work, knowingly relying on a patent license,
-and the Corresponding Source of the work is not available for anyone
-to copy, free of charge and under the terms of this License, through a
-publicly available network server or other readily accessible means,
-then you must either (1) cause the Corresponding Source to be so
-available, or (2) arrange to deprive yourself of the benefit of the
-patent license for this particular work, or (3) arrange, in a manner
-consistent with the requirements of this License, to extend the patent
-license to downstream recipients.  "Knowingly relying" means you have
-actual knowledge that, but for the patent license, your conveying the
-covered work in a country, or your recipient's use of the covered work
-in a country, would infringe one or more identifiable patents in that
-country that you have reason to believe are valid.
-
-  If, pursuant to or in connection with a single transaction or
-arrangement, you convey, or propagate by procuring conveyance of, a
-covered work, and grant a patent license to some of the parties
-receiving the covered work authorizing them to use, propagate, modify
-or convey a specific copy of the covered work, then the patent license
-you grant is automatically extended to all recipients of the covered
-work and works based on it.
-
-  A patent license is "discriminatory" if it does not include within
-the scope of its coverage, prohibits the exercise of, or is
-conditioned on the non-exercise of one or more of the rights that are
-specifically granted under this License.  You may not convey a covered
-work if you are a party to an arrangement with a third party that is
-in the business of distributing software, under which you make payment
-to the third party based on the extent of your activity of conveying
-the work, and under which the third party grants, to any of the
-parties who would receive the covered work from you, a discriminatory
-patent license (a) in connection with copies of the covered work
-conveyed by you (or copies made from those copies), or (b) primarily
-for and in connection with specific products or compilations that
-contain the covered work, unless you entered into that arrangement,
-or that patent license was granted, prior to 28 March 2007.
-
-  Nothing in this License shall be construed as excluding or limiting
-any implied license or other defenses to infringement that may
-otherwise be available to you under applicable patent law.
-
-  12. No Surrender of Others' Freedom.
-
-  If conditions are imposed on you (whether by court order, agreement or
-otherwise) that contradict the conditions of this License, they do not
-excuse you from the conditions of this License.  If you cannot convey a
-covered work so as to satisfy simultaneously your obligations under this
-License and any other pertinent obligations, then as a consequence you may
-not convey it at all.  For example, if you agree to terms that obligate you
-to collect a royalty for further conveying from those to whom you convey
-the Program, the only way you could satisfy both those terms and this
-License would be to refrain entirely from conveying the Program.
-
-  13. Use with the GNU Affero General Public License.
-
-  Notwithstanding any other provision of this License, you have
-permission to link or combine any covered work with a work licensed
-under version 3 of the GNU Affero General Public License into a single
-combined work, and to convey the resulting work.  The terms of this
-License will continue to apply to the part which is the covered work,
-but the special requirements of the GNU Affero General Public License,
-section 13, concerning interaction through a network will apply to the
-combination as such.
-
-  14. Revised Versions of this License.
-
-  The Free Software Foundation may publish revised and/or new versions of
-the GNU General Public License from time to time.  Such new versions will
-be similar in spirit to the present version, but may differ in detail to
-address new problems or concerns.
-
-  Each version is given a distinguishing version number.  If the
-Program specifies that a certain numbered version of the GNU General
-Public License "or any later version" applies to it, you have the
-option of following the terms and conditions either of that numbered
-version or of any later version published by the Free Software
-Foundation.  If the Program does not specify a version number of the
-GNU General Public License, you may choose any version ever published
-by the Free Software Foundation.
-
-  If the Program specifies that a proxy can decide which future
-versions of the GNU General Public License can be used, that proxy's
-public statement of acceptance of a version permanently authorizes you
-to choose that version for the Program.
-
-  Later license versions may give you additional or different
-permissions.  However, no additional obligations are imposed on any
-author or copyright holder as a result of your choosing to follow a
-later version.
-
-  15. Disclaimer of Warranty.
-
-  THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY
-APPLICABLE LAW.  EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT
-HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY
-OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO,
-THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
-PURPOSE.  THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM
-IS WITH YOU.  SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF
-ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
-
-  16. Limitation of Liability.
-
-  IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
-WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS
-THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY
-GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE
-USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF
-DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD
-PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS),
-EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF
-SUCH DAMAGES.
-
-  17. Interpretation of Sections 15 and 16.
-
-  If the disclaimer of warranty and limitation of liability provided
-above cannot be given local legal effect according to their terms,
-reviewing courts shall apply local law that most closely approximates
-an absolute waiver of all civil liability in connection with the
-Program, unless a warranty or assumption of liability accompanies a
-copy of the Program in return for a fee.
-
-                     END OF TERMS AND CONDITIONS
-
-            How to Apply These Terms to Your New Programs
-
-  If you develop a new program, and you want it to be of the greatest
-possible use to the public, the best way to achieve this is to make it
-free software which everyone can redistribute and change under these terms.
-
-  To do so, attach the following notices to the program.  It is safest
-to attach them to the start of each source file to most effectively
-state the exclusion of warranty; and each file should have at least
-the "copyright" line and a pointer to where the full notice is found.
-
-    <one line to give the program's name and a brief idea of what it does.>
-    Copyright (C) <year>  <name of author>
-
-    This program is free software: you can redistribute it and/or modify
-    it under the terms of the GNU General Public License as published by
-    the Free Software Foundation, either version 3 of the License, or
-    (at your option) any later version.
-
-    This program is distributed in the hope that it will be useful,
-    but WITHOUT ANY WARRANTY; without even the implied warranty of
-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-    GNU General Public License for more details.
-
-    You should have received a copy of the GNU General Public License
-    along with this program.  If not, see <http://www.gnu.org/licenses/>.
-
-Also add information on how to contact you by electronic and paper mail.
-
-  If the program does terminal interaction, make it output a short
-notice like this when it starts in an interactive mode:
-
-    <program>  Copyright (C) <year>  <name of author>
-    This program comes with ABSOLUTELY NO WARRANTY; for details type `show w'.
-    This is free software, and you are welcome to redistribute it
-    under certain conditions; type `show c' for details.
-
-The hypothetical commands `show w' and `show c' should show the appropriate
-parts of the General Public License.  Of course, your program's commands
-might be different; for a GUI interface, you would use an "about box".
-
-  You should also get your employer (if you work as a programmer) or school,
-if any, to sign a "copyright disclaimer" for the program, if necessary.
-For more information on this, and how to apply and follow the GNU GPL, see
-<http://www.gnu.org/licenses/>.
-
-  The GNU General Public License does not permit incorporating your program
-into proprietary programs.  If your program is a subroutine library, you
-may consider it more useful to permit linking proprietary applications with
-the library.  If this is what you want to do, use the GNU Lesser General
-Public License instead of this License.  But first, please read
-<http://www.gnu.org/philosophy/why-not-lgpl.html>.
diff --git a/pyproject.toml b/pyproject.toml
index 4ffab2e..d219808 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "casparser"
-description = "(Karvy/Kfintech/CAMS) Consolidated Account Statement (CAS) PDF parser"
+description = "(CAMS/KFintech/NSDL/CDSL) Consolidated Account Statement (CAS) PDF parser"
 authors = [{ name = "Sandeep Somasekharan", email = "codereverser@gmail.com" }]
 requires-python = ">=3.11"
 readme = "README.md"
@@ -16,19 +16,18 @@ classifiers = [
 ]
 dependencies = [
     "casparser-isin>=2026.5.1",
-    "click>=8.0,<9.0",
+    "click>=8.0,<10",
     "colorama>=0.4.6,<1",
-    "pdfminer.six>=20240706",
+    # pypdfium2 ships a vendored C lib; we use the raw ctypes surface
+    # (FPDFText_GetCharOrigin etc.), so cap a major ahead to catch
+    # breaking ABI bumps before they hit users.
+    "pypdfium2>=5.0,<7",
     "python-dateutil>=2.8.2,<3",
     "rich>=13.5.2,<16",
     "pydantic>=2.3.0,<3",
 ]
 dynamic = ["version"]
 
-[project.optional-dependencies]
-mupdf = ["PyMuPDF>=1.25.0"]
-fast = ["PyMuPDF>=1.25.0"]
-
 [project.urls]
 Homepage = "https://github.com/codereverser/casparser"
 
@@ -37,10 +36,10 @@ casparser = "casparser.cli:cli"
 
 [dependency-groups]
 dev = [
-    "coverage[toml]>=7.3.0,<8",
-    "ipython>=8.31.0,<9",
+    "coverage[toml]>=7.3.0,<9",
+    "ipython>=8.31.0",
     "pytest>=8.0.0,<10",
-    "pytest-cov~=6.0.0",
+    "pytest-cov>=6.0,<8",
     "pre-commit>=4.0.0,<5",
 ]
 
diff --git a/tests/_assertions.py b/tests/_assertions.py
new file mode 100644
index 0000000..64f30bc
--- /dev/null
+++ b/tests/_assertions.py
@@ -0,0 +1,254 @@
+"""Invariant helpers shared across the e2e test suite.
+
+Each assertion checks a structural / arithmetic property of a parsed
+CAS object — designed so the test files can lock in correctness
+without encoding the real rupee figures from private fixtures.
+
+Examples of what these catch:
+  - Column-swap bugs   (qty * price != value)
+  - Decimal-parse bugs (comma stripped wrong)
+  - Routing bugs       (a bond row entering equities list)
+  - Anchor-drift bugs  (units cell read as 0)
+
+Tolerances are deliberately small — these are bookkeeping numbers from
+the CAS itself, so the rounding error is bounded by how the source
+statement rounds.
+"""
+
+from __future__ import annotations
+
+import re
+from decimal import Decimal
+
+# 1 paisa absolute slop is enough — these numbers come from the CAS as
+# already-rounded printed figures, so we expect exact equality but
+# leave a hair-thin epsilon for Decimal arithmetic noise.
+ABS_TOL = Decimal("0.01")
+
+# 0.5% relative tolerance on derived figures (qty * nav vs value).
+# CAS issuers truncate NAVs at 4dp and units at 3dp, so per-row
+# rounding can land 5–10 paise off on a ₹5L scheme without indicating
+# a parser bug; 0.5% (₹2,500 on ₹5L) sits far above that noise floor.
+REL_TOL = Decimal("0.005")
+
+# Indian PAN format: 5 letters, 4 digits, 1 letter.
+PAN_RE = re.compile(r"^[A-Z]{5}[0-9]{4}[A-Z]$")
+
+
+def _D(x) -> Decimal:
+    return Decimal(str(x))
+
+
+def assert_relclose(actual, expected, tol: Decimal = REL_TOL, *, label: str = ""):
+    """abs(actual - expected) / abs(expected) <= tol (or absolute slop
+    when expected == 0)."""
+    a, e = _D(actual), _D(expected)
+    if e == 0:
+        assert abs(a) <= ABS_TOL, f"{label}: expected ~0, got {a}"
+        return
+    rel = abs(a - e) / abs(e)
+    assert rel <= tol, f"{label}: {a} vs {e}, rel_diff={rel:.4%} > {tol:.4%}"
+
+
+# ----------------------------------------------------------------- CAMS/KFin
+def assert_scheme_well_formed(scheme):
+    """Schemes must always carry ISIN, AMFI and RTA codes plus a valuation
+    with a positive NAV (the v1.0 parser populates ISIN/AMFI via casparser-isin)."""
+    assert scheme.isin, f"scheme {scheme.scheme!r}: no ISIN"
+    assert scheme.amfi, f"scheme {scheme.scheme!r}: no AMFI"
+    assert scheme.rta_code, f"scheme {scheme.scheme!r}: no rta_code"
+    assert scheme.valuation is not None
+    assert _D(scheme.valuation.nav) > 0, f"scheme {scheme.scheme!r}: zero/negative NAV"
+
+
+def assert_scheme_valuation_arithmetic(scheme):
+    """`close_balance * valuation.nav` should reproduce
+    `valuation.value` to within rounding error.
+
+    Catches a swapped or misread NAV / value column."""
+    close = _D(scheme.close)
+    if close == 0:
+        # Fully redeemed schemes legitimately have value = 0.
+        assert (
+            _D(scheme.valuation.value) == 0
+        ), f"scheme {scheme.scheme!r}: close=0 but value={scheme.valuation.value}"
+        return
+    derived = close * _D(scheme.valuation.nav)
+    assert_relclose(
+        derived,
+        scheme.valuation.value,
+        label=f"scheme {scheme.scheme!r}: close*nav vs value",
+    )
+
+
+def assert_scheme_transaction_units_close(scheme):
+    """`open + Σ(txn.units) == close` (exact to 3-decimal-place
+    precision, matching how CAS issuers report unit balances).
+
+    This is the strongest correctness check on the transaction
+    history: every txn that changes units must be captured. A
+    missed purchase, misread date, dropped redemption, or merged
+    duplicate row breaks the equality.
+
+    Stamp-duty and STT entries don't carry units (``t.units is
+    None``) so they're skipped here — they only deduct from the
+    cash side, not the unit balance.
+    """
+    o = _D(scheme.open)
+    c = _D(scheme.close)
+    sum_u = sum(
+        (_D(t.units) for t in scheme.transactions if t.units is not None),
+        _D(0),
+    )
+    diff = abs(o + sum_u - c)
+    assert diff <= _D("0.001"), (
+        f"scheme {scheme.scheme!r}: open={o} + Σ(units)={sum_u} " f"!= close={c} (diff={diff})"
+    )
+
+
+def assert_folio_well_formed(folio):
+    assert PAN_RE.match(
+        folio.PAN or ""
+    ), f"folio {folio.folio!r}: PAN {folio.PAN!r} fails {PAN_RE.pattern}"
+    assert folio.amc, f"folio {folio.folio!r}: empty AMC"
+    assert folio.schemes, f"folio {folio.folio!r}: no schemes"
+
+
+def assert_investor_info_complete(info):
+    """CAMS/KFin investor info: every field is populated."""
+    assert info.name, "investor: missing name"
+    assert info.email, "investor: missing email"
+    assert info.mobile, "investor: missing mobile"
+    assert info.address, "investor: missing address"
+
+
+# ----------------------------------------------------------------- NSDL/CDSL
+ISIN_EQ_RE = re.compile(r"^IN[E9][0-9A-Z]{8}\d$")
+ISIN_MF_RE = re.compile(r"^INF[0-9A-Z]{8}\d$")
+ISIN_ANY_RE = re.compile(r"^[A-Z]{2}[0-9A-Z]{9}\d$")
+
+
+def assert_equity_well_formed(eq):
+    """Every NSDL/CDSL equity row carries a well-formed ISIN.
+
+    Lapsed rights entitlements / fully-redeemed positions show up
+    with num_shares=0 and value=0 — those are valid informational
+    rows, not parser failures, so the invariant only asserts
+    consistency: value, price and num_shares are non-negative, and
+    a positive value requires a positive price.
+
+    The harder per-row invariant (`num_shares * price == value`)
+    is intentionally *not* enforced — some NSDL summary rows
+    inline a 'of which Pledged' note that confuses the quantity
+    column. The account-level Σ(value) == balance check covers
+    the dropped-row case, which is the more dangerous one.
+    """
+    assert ISIN_ANY_RE.match(eq.isin or ""), f"equity: bad ISIN {eq.isin!r}"
+    assert _D(eq.value) >= 0, f"equity {eq.isin}: negative value"
+    assert _D(eq.price) >= 0, f"equity {eq.isin}: negative price"
+    assert _D(eq.num_shares) >= 0, f"equity {eq.isin}: negative shares"
+    if _D(eq.value) > 0:
+        assert _D(eq.price) > 0, f"equity {eq.isin}: positive value {eq.value} but zero price"
+
+
+def assert_mutual_fund_well_formed(mf):
+    """Every NSDL/CDSL MF holding has an INF ISIN and obeys
+    `balance * nav ≈ value`.
+
+    Fully-redeemed schemes legitimately show with balance=0 and
+    value=0; when value is 0 we check only the ISIN, non-negativity,
+    and that balance is also 0 (NAV is not checked).
+
+    Otherwise this is the strongest per-row invariant for the MF
+    Holdings detailed table — catches the anchor-drift case where
+    the units cell falls outside its expected x-band and balance
+    reads as 0 while value stays correct.
+    """
+    assert ISIN_MF_RE.match(mf.isin or ""), f"MF: bad ISIN {mf.isin!r}"
+    assert _D(mf.value) >= 0, f"MF {mf.isin}: negative value"
+    assert _D(mf.balance) >= 0, f"MF {mf.isin}: negative balance"
+    if _D(mf.value) == 0:
+        # Fully-redeemed — balance must also be 0, NAV may be any value.
+        assert _D(mf.balance) == 0, f"MF {mf.isin}: value=0 but balance={mf.balance}"
+        return
+    assert _D(mf.nav) > 0, f"MF {mf.isin}: zero NAV with positive value"
+    derived = _D(mf.balance) * _D(mf.nav)
+    assert_relclose(
+        derived,
+        mf.value,
+        label=f"MF {mf.isin}: balance*nav vs value",
+    )
+
+
+def assert_bond_summary_form(bd):
+    """Summary-form bonds (NSDL-account pages) carry full metadata
+    and obey `num_bonds * face_value == value` exactly."""
+    assert ISIN_ANY_RE.match(bd.isin or ""), f"bond: bad ISIN {bd.isin!r}"
+    assert bd.face_value is not None, f"bond {bd.isin}: missing face_value"
+    assert bd.coupon_rate is not None, f"bond {bd.isin}: missing coupon_rate"
+    assert bd.coupon_frequency, f"bond {bd.isin}: missing coupon_frequency"
+    assert bd.maturity_date, f"bond {bd.isin}: missing maturity_date"
+    # Summary form doesn't carry market price.
+    assert bd.market_price is None, f"bond {bd.isin}: unexpected market_price on summary row"
+    derived = _D(bd.num_bonds) * _D(bd.face_value)
+    assert derived == _D(
+        bd.value
+    ), f"bond {bd.isin}: num_bonds*face_value={derived} != value={bd.value}"
+
+
+def assert_bond_detailed_form(bd):
+    """Detailed-form bonds (CDSL-account pages) carry only quantity,
+    market price and value — no coupon metadata."""
+    assert ISIN_ANY_RE.match(bd.isin or ""), f"bond: bad ISIN {bd.isin!r}"
+    assert bd.market_price is not None, f"bond {bd.isin}: missing market_price"
+    assert bd.face_value is None, f"bond {bd.isin}: unexpected face_value on detailed row"
+    assert bd.coupon_rate is None, f"bond {bd.isin}: unexpected coupon_rate on detailed row"
+    derived = _D(bd.num_bonds) * _D(bd.market_price)
+    assert_relclose(
+        derived,
+        bd.value,
+        label=f"bond {bd.isin}: num_bonds*market_price vs value",
+    )
+
+
+def assert_account_balance_closes(account):
+    """Σ(equity.value) + Σ(mf.value) + Σ(bond.value) == account.balance.
+
+    The strongest holding-level invariant for NSDL/CDSL: if a row was
+    misrouted between sections (e.g. a bond counted as an equity)
+    this sum still matches because the value column is the same;
+    if a row was DROPPED, the sum falls short.
+    """
+    eq = sum((_D(e.value) for e in account.equities), Decimal(0))
+    mf = sum((_D(m.value) for m in account.mutual_funds), Decimal(0))
+    bd = sum((_D(b.value) for b in account.bonds), Decimal(0))
+    derived = eq + mf + bd
+    diff = abs(derived - _D(account.balance))
+    assert diff <= ABS_TOL, (
+        f"account {account.type!r} dp={account.dp_id or '-'} cl={account.client_id or '-'}: "
+        f"Σ(values)={derived}  balance={account.balance}  diff={diff}"
+    )
+
+
+def assert_demat_account_well_formed(account):
+    """An account has a recognised type, plus DP/Client IDs in the format
+    expected for that type (both empty for 'Mutual Fund Folios')."""
+    assert account.type in (
+        "NSDL Demat Account",
+        "CDSL Demat Account",
+        "Mutual Fund Folios",
+    ), f"account: unexpected type {account.type!r}"
+    if account.type == "NSDL Demat Account":
+        # NSDL DP IDs look like 'IN######' (IN + 6 digits).
+        assert re.match(
+            r"^IN\d{6}$", account.dp_id or ""
+        ), f"NSDL demat: bad DP ID {account.dp_id!r}"
+        # Client IDs are 8-digit.
+        assert re.match(r"^\d{8}$", account.client_id or ""), "NSDL demat: bad Client ID format"
+    elif account.type == "CDSL Demat Account":
+        # CDSL DP IDs are 8-digit numerics.
+        assert re.match(r"^\d{8}$", account.dp_id or ""), "CDSL demat: bad DP ID format"
+        assert re.match(r"^\d{8}$", account.client_id or ""), "CDSL demat: bad Client ID format"
+    else:
+        # Pseudo MF-Folios account has no DP/Client.
+        assert account.dp_id == "" and account.client_id == ""
diff --git a/tests/base.py b/tests/base.py
deleted file mode 100644
index 5da27b9..0000000
--- a/tests/base.py
+++ /dev/null
@@ -1,103 +0,0 @@
-import io
-import json
-import os
-import re
-
-import pytest
-from click.testing import CliRunner
-
-from casparser import read_cas_pdf
-from casparser.enums import CASFileType
-from casparser.exceptions import CASParseError, IncorrectPasswordError
-
-
-class BaseTestClass:
-    """Common test cases for all available parsers."""
-
-    ansi_cleaner = re.compile(r"\x1b\[([0-9,A-Z]{1,2}(;[0-9]{1,2})?(;[0-9]{3})?)?[m|K]?")
-
-    @classmethod
-    def setup_class(cls):
-        cls.cams_file_name = os.getenv("CAMS_CAS_FILE")
-        cls.new_cams_file_name = os.getenv("CAMS_CAS_FILE_NEW")
-        cls.cams_summary_file_name = os.getenv("CAMS_CAS_SUMMARY")
-        cls.kfintech_summary_file_name = os.getenv("KFINTECH_CAS_SUMMARY")
-        cls.kfintech_file_name = os.getenv("KFINTECH_CAS_FILE")
-        cls.new_kfintech_file_name = os.getenv("KFINTECH_CAS_FILE_NEW")
-        cls.bad_file_name = os.getenv("BAD_CAS_FILE")
-        cls.cams_password = os.getenv("CAMS_CAS_PASSWORD")
-        cls.kfintech_password = os.getenv("KFINTECH_CAS_PASSWORD")
-        cls.nsdl_file_name = os.getenv("NSDL_CAS_FILE_1")
-
-        cls.pdf_files = [
-            (cls.cams_file_name, cls.cams_password, 10, 14),
-            (cls.new_cams_file_name, cls.cams_password, 14, 30),
-            (cls.kfintech_file_name, cls.kfintech_password, 17, 30),
-            (cls.new_kfintech_file_name, cls.kfintech_password, 14, 30),
-        ]
-
-    def read_pdf(self, filename, password, output="dict"):
-        return read_cas_pdf(filename, password, output=output)
-
-    def test_output_json(self):
-        for filename, password, num_folios, _ in self.pdf_files:
-            json_data = self.read_pdf(filename, password, output="json")
-            data = json.loads(json_data)
-            assert (
-                len(data.get("folios", [])) == num_folios
-            ), f"Expected : {num_folios} :: Got {len(data.get('folios', []))}"
-            for folio in data["folios"]:
-                assert isinstance(folio["PAN"], str) and len(folio["PAN"]) == 10
-                for scheme in folio.get("schemes", []):
-                    assert scheme["isin"] is not None
-                    assert scheme["amfi"] is not None
-                    assert scheme["advisor"] not in (None, "ARN")
-            assert data.get("investor_info", {}).get("mobile") not in (None, "")
-            assert data["cas_type"] == CASFileType.DETAILED.value
-
-    def test_read_summary(self):
-        summary_files = (
-            (self.cams_summary_file_name, self.cams_password, 4, 6),
-            (self.kfintech_summary_file_name, self.kfintech_password, 9, 13),
-        )
-        for filename, password, num_folios, num_schemes in summary_files:
-            data = self.read_pdf(filename, password)
-            assert len(data.folios) == num_folios
-            schemes_found = 0
-            for folio in data.folios:
-                schemes_found += len(folio.schemes)
-                for scheme in folio.schemes:
-                    assert scheme.isin is not None
-                    assert scheme.amfi is not None
-            assert schemes_found == num_schemes
-            assert data.investor_info.mobile not in (None, "")
-            assert data.cas_type == CASFileType.SUMMARY.value
-
-    def test_read_dict(self):
-        from casparser.cli import cli
-
-        runner = CliRunner()
-
-        for pdf_file, pdf_password, _, num_schemes in self.pdf_files:
-            args = [pdf_file, "-p", pdf_password, "-a"]
-            result = runner.invoke(cli, args)
-            assert result.exit_code == 0
-            clean_output = self.ansi_cleaner.sub("", result.output)
-            assert "Statement Period :" in clean_output
-            assert re.search(rf"Matched\s+:\s+{num_schemes}\s+schemes", clean_output) is not None
-            assert re.search(r"Error\s+:\s+0\s+schemes", clean_output) is not None
-
-    def test_invalid_password(self):
-        with pytest.raises(IncorrectPasswordError) as exc_info:
-            self.read_pdf(self.cams_file_name, "")
-        assert "Incorrect PDF password!" in str(exc_info)
-
-    def test_invalid_file(self):
-        with pytest.raises(CASParseError) as exc_info, io.BytesIO(b"test") as fp:
-            self.read_pdf(fp, "")
-        assert "Unhandled error while opening" in str(exc_info)
-
-    def test_invalid_file_type(self):
-        with pytest.raises(CASParseError) as exc_info:
-            self.read_pdf(1, "")
-        assert "Invalid input" in str(exc_info)
diff --git a/tests/conftest.py b/tests/conftest.py
index 35cd279..18916d8 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -1,4 +1,170 @@
+"""Shared pytest fixtures for the e2e suite.
+
+Each fixture skips its dependent tests when the corresponding env
+var isn't set, so contributors without the encrypted sample bundle
+can still run unit-level tests. The PDFs themselves are parsed once
+per module via the `*_data` fixtures to keep wall-time low.
+
+The encrypted fixtures (`tests/files.enc`) are decoded into
+`tests/files/` by `.github/scripts/extract_files.sh` on CI; locally,
+the same files live in `tests/files/` for tests that don't need a
+password (`nsdl_statement_1.pdf`) and the rest are skipped.
+"""
+
+from __future__ import annotations
+
+import os
+import re
+
 import pytest
 
-# Rewrite asserts in base test class
-pytest.register_assert_rewrite("tests.base")
+# Make assertion-rewriting work for the shared invariant helpers, so
+# failed assertions inside `_assertions.assert_*` show useful diffs
+# instead of bare `AssertionError`.
+pytest.register_assert_rewrite("tests._assertions")
+
+
+# Strips ANSI CSI sequences (ESC "[" + parameter bytes + intermediate
+# bytes + one final byte) so CLI assertions survive `rich`-coloured output.
+ANSI_RE = re.compile(r"\x1b\[[0-?]*[ -/]*[@-~]")
+
+
+def strip_ansi(s: str) -> str:
+    return ANSI_RE.sub("", s)  # e.g. "\x1b[1;31mX\x1b[0m" -> "X"
+
+
+def _required_env(var: str) -> str:
+    """Return the value of env var `var`, skipping the test if unset/empty."""
+    if value := os.getenv(var):
+        return value
+    pytest.skip(f"environment variable {var} not set")
+
+
+# --- passwords --------------------------------------------------------------
+
+
+@pytest.fixture(scope="session")
+def cams_password() -> str:
+    return _required_env("CAMS_CAS_PASSWORD")
+
+
+@pytest.fixture(scope="session")
+def kfin_password() -> str:
+    return _required_env("KFINTECH_CAS_PASSWORD")
+
+
+@pytest.fixture(scope="session")
+def cdsl_password() -> str:
+    # CDSL_CAS_PASSWORD may legitimately be empty for some samples.
+    return os.getenv("CDSL_CAS_PASSWORD", "")
+
+
+# --- file paths (skip on missing env var) -----------------------------------
+
+
+@pytest.fixture(scope="session")
+def cams_file() -> str:
+    return _required_env("CAMS_CAS_FILE")
+
+
+@pytest.fixture(scope="session")
+def cams_file_new() -> str:
+    return _required_env("CAMS_CAS_FILE_NEW")
+
+
+@pytest.fixture(scope="session")
+def cams_summary_file() -> str:
+    return _required_env("CAMS_CAS_SUMMARY")
+
+
+@pytest.fixture(scope="session")
+def kfin_file() -> str:
+    return _required_env("KFINTECH_CAS_FILE")
+
+
+@pytest.fixture(scope="session")
+def kfin_file_new() -> str:
+    return _required_env("KFINTECH_CAS_FILE_NEW")
+
+
+@pytest.fixture(scope="session")
+def kfin_summary_file() -> str:
+    return _required_env("KFINTECH_CAS_SUMMARY")
+
+
+@pytest.fixture(scope="session")
+def nsdl_file() -> str:
+    return _required_env("NSDL_CAS_FILE_1")
+
+
+@pytest.fixture(scope="session")
+def cdsl_file() -> str:
+    return _required_env("CDSL_CAS_FILE_1")
+
+
+@pytest.fixture(scope="session")
+def bad_file() -> str:
+    return _required_env("BAD_CAS_FILE")
+
+
+# --- parsed-data fixtures (one parse per module) ----------------------------
+#
+# Each `*_data` fixture parses its PDF exactly once per pytest module,
+# so per-issuer test files share the work across their methods.
+
+
+@pytest.fixture(scope="module")
+def cams_data(cams_file, cams_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(cams_file, cams_password)
+
+
+@pytest.fixture(scope="module")
+def cams_new_data(cams_file_new, cams_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(cams_file_new, cams_password)
+
+
+@pytest.fixture(scope="module")
+def cams_summary_data(cams_summary_file, cams_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(cams_summary_file, cams_password)
+
+
+@pytest.fixture(scope="module")
+def kfin_data(kfin_file, kfin_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(kfin_file, kfin_password)
+
+
+@pytest.fixture(scope="module")
+def kfin_new_data(kfin_file_new, kfin_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(kfin_file_new, kfin_password)
+
+
+@pytest.fixture(scope="module")
+def kfin_summary_data(kfin_summary_file, kfin_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(kfin_summary_file, kfin_password)
+
+
+@pytest.fixture(scope="module")
+def nsdl_data(nsdl_file):
+    from casparser import read_cas_pdf
+
+    # NSDL_CAS_FILE_1 in the current bundle is not password-protected.
+    return read_cas_pdf(nsdl_file, "")
+
+
+@pytest.fixture(scope="module")
+def cdsl_data(cdsl_file, cdsl_password):
+    from casparser import read_cas_pdf
+
+    return read_cas_pdf(cdsl_file, cdsl_password)
diff --git a/tests/files.enc b/tests/files.enc
index 249e5ef..4bd6ce1 100644
Binary files a/tests/files.enc and b/tests/files.enc differ
diff --git a/tests/pytest.ini b/tests/pytest.ini
deleted file mode 100644
index e69de29..0000000
diff --git a/tests/test_cams.py b/tests/test_cams.py
new file mode 100644
index 0000000..e0d4cb5
--- /dev/null
+++ b/tests/test_cams.py
@@ -0,0 +1,218 @@
+"""End-to-end tests for CAMS CAS files.
+
+Two detailed fixtures (`CAMS_CAS_FILE` short-period + `CAMS_CAS_FILE_NEW`
+multi-decade) plus a summary fixture (`CAMS_CAS_SUMMARY`). Each test
+parses one fixture via a module-scoped fixture in `conftest.py`.
+
+Assertions cover:
+  * Exact folio + scheme counts (regression guard for schema-detection)
+  * Schema-level invariants: ISIN/AMFI/RTA populated, PAN well-formed,
+    valuation.nav > 0
+  * Arithmetic invariant `close * valuation.nav ≈ valuation.value`
+    (catches column-swap and decimal-parse bugs without encoding
+    rupee figures from the private fixture)
+"""
+
+from __future__ import annotations
+
+import json
+
+from click.testing import CliRunner
+
+from casparser.enums import CASFileType
+
+from ._assertions import (
+    assert_folio_well_formed,
+    assert_investor_info_complete,
+    assert_scheme_transaction_units_close,
+    assert_scheme_valuation_arithmetic,
+    assert_scheme_well_formed,
+)
+
+# Exact fixture shape (folios, schemes) — locked in to catch any
+# regression in header / footer / table-boundary detection.
+DETAILED = {
+    "main": dict(folios=10, schemes=14, period_from="01-Apr-2018", period_to="30-Jun-2018"),
+    "new": dict(folios=14, schemes=30, period_from="01-Jan-2000", period_to="31-Aug-2023"),
+}
+SUMMARY = dict(folios=4, schemes=6)
+
+
+# --- detailed -------------------------------------------------------------
+
+
+class TestCAMSDetailed:
+    """Short-period CAMS DETAILED statement (`CAMS_CAS_FILE`)."""
+
+    def test_shape(self, cams_data):
+        d = cams_data
+        assert d.file_type == "CAMS"
+        assert d.cas_type == CASFileType.DETAILED.value
+        assert d.statement_period.from_ == DETAILED["main"]["period_from"]
+        assert d.statement_period.to == DETAILED["main"]["period_to"]
+        assert len(d.folios) == DETAILED["main"]["folios"]
+        total_schemes = sum(len(f.schemes) for f in d.folios)
+        assert total_schemes == DETAILED["main"]["schemes"]
+
+    def test_investor_info(self, cams_data):
+        assert_investor_info_complete(cams_data.investor_info)
+
+    def test_every_folio_well_formed(self, cams_data):
+        for folio in cams_data.folios:
+            assert_folio_well_formed(folio)
+
+    def test_every_scheme_well_formed(self, cams_data):
+        for folio in cams_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_well_formed(scheme)
+
+    def test_close_times_nav_equals_valuation(self, cams_data):
+        """`scheme.close * scheme.valuation.nav` reproduces
+        `scheme.valuation.value` for every scheme."""
+        for folio in cams_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_valuation_arithmetic(scheme)
+
+    def test_open_plus_units_equals_close(self, cams_data):
+        """`scheme.open + Σ(txn.units) == scheme.close` exactly for
+        every scheme. Catches dropped / mis-dated / duplicated
+        transactions on the unit side."""
+        for folio in cams_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_transaction_units_close(scheme)
+
+    def test_json_output(self, cams_file, cams_password):
+        """JSON serialization round-trip preserves the schema."""
+        from casparser import read_cas_pdf
+
+        raw = read_cas_pdf(cams_file, cams_password, output="json")
+        data = json.loads(raw)
+        assert data["file_type"] == "CAMS"
+        assert data["cas_type"] == CASFileType.DETAILED.value
+        assert len(data["folios"]) == DETAILED["main"]["folios"]
+        # Every scheme keeps its ISIN/AMFI through JSON serialization.
+        for f in data["folios"]:
+            for s in f["schemes"]:
+                assert s["isin"], f"JSON: scheme without ISIN: {s['scheme']!r}"
+                assert s["amfi"], f"JSON: scheme without AMFI: {s['scheme']!r}"
+
+
+class TestCAMSDetailedNew:
+    """Multi-decade CAMS DETAILED statement (`CAMS_CAS_FILE_NEW`)."""
+
+    def test_shape(self, cams_new_data):
+        d = cams_new_data
+        assert d.file_type == "CAMS"
+        assert d.cas_type == CASFileType.DETAILED.value
+        assert d.statement_period.from_ == DETAILED["new"]["period_from"]
+        assert d.statement_period.to == DETAILED["new"]["period_to"]
+        assert len(d.folios) == DETAILED["new"]["folios"]
+        total_schemes = sum(len(f.schemes) for f in d.folios)
+        assert total_schemes == DETAILED["new"]["schemes"]
+
+    def test_every_scheme_well_formed(self, cams_new_data):
+        for folio in cams_new_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_well_formed(scheme)
+
+    def test_close_times_nav_equals_valuation(self, cams_new_data):
+        for folio in cams_new_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_valuation_arithmetic(scheme)
+
+    def test_open_plus_units_equals_close(self, cams_new_data):
+        for folio in cams_new_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_transaction_units_close(scheme)
+
+
+# --- summary --------------------------------------------------------------
+
+
+class TestCAMSSummary:
+    """CAMS SUMMARY statement (`CAMS_CAS_SUMMARY`)."""
+
+    def test_shape(self, cams_summary_data):
+        d = cams_summary_data
+        assert d.file_type == "CAMS"
+        assert d.cas_type == CASFileType.SUMMARY.value
+        assert len(d.folios) == SUMMARY["folios"]
+        total_schemes = sum(len(f.schemes) for f in d.folios)
+        assert total_schemes == SUMMARY["schemes"]
+
+    def test_investor_info(self, cams_summary_data):
+        assert_investor_info_complete(cams_summary_data.investor_info)
+
+    def test_every_scheme_well_formed(self, cams_summary_data):
+        for folio in cams_summary_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_well_formed(scheme)
+
+    def test_close_times_nav_equals_valuation(self, cams_summary_data):
+        for folio in cams_summary_data.folios:
+            for scheme in folio.schemes:
+                assert_scheme_valuation_arithmetic(scheme)
+
+
+# --- CLI ------------------------------------------------------------------
+
+
+class TestCAMSCLI:
+    """One CLI invocation per output format proves the wiring still works.
+
+    Detailed assertion of CLI semantics for other issuers is covered
+    in their own files; this file owns the CAMS-specific paths
+    (default JSON, CSV detailed, summary CSV, `-s` summary table)."""
+
+    def test_default_invocation(self, tmp_path, cams_file, cams_password):
+        from casparser.cli import cli
+
+        out = tmp_path / "out.json"
+        result = CliRunner().invoke(
+            cli,
+            [cams_file, "-p", cams_password, "-o", str(out)],
+        )
+        assert result.exit_code == 0, result.output
+        assert "File saved" in result.output
+        payload = json.loads(out.read_text())
+        assert payload["file_type"] == "CAMS"
+
+    def test_csv_output(self, tmp_path, cams_file, cams_password):
+        from casparser.cli import cli
+
+        out = tmp_path / "out.csv"
+        result = CliRunner().invoke(
+            cli,
+            [cams_file, "-p", cams_password, "-o", str(out)],
+        )
+        assert result.exit_code == 0, result.output
+        assert "File saved" in result.output
+        # cas2csv columns
+        content = out.read_text()
+        for col in ("amc", "folio", "isin", "amfi", "scheme"):
+            assert col in content, f"missing CSV column {col!r}"
+
+    def test_summary_csv_output(self, tmp_path, cams_file, cams_password):
+        """`-s -o file.csv` writes the SUMMARY-format CSV (covers
+        `cas2csv_summary`); CLI output is attached to a non-zero exit."""
+        from casparser.cli import cli
+
+        out = tmp_path / "summary.csv"
+        result = CliRunner().invoke(
+            cli,
+            [cams_file, "-p", cams_password, "-s", "-o", str(out)],
+        )
+        assert result.exit_code == 0, result.output
+        content = out.read_text()
+        for col in ("amc", "folio", "isin", "amfi", "scheme"):
+            assert col in content, f"missing summary CSV column {col!r}"
+
+    def test_summary_terminal_output(self, cams_file, cams_password):
+        """CLI without `-o` exits 0 (output shown on failure) and prints the period line."""
+        from casparser.cli import cli
+        from tests.conftest import strip_ansi
+
+        result = CliRunner().invoke(cli, [cams_file, "-p", cams_password, "-a"])
+        assert result.exit_code == 0, result.output
+        clean = strip_ansi(result.output)
+        assert "Statement Period :" in clean
diff --git a/tests/test_cdsl.py b/tests/test_cdsl.py
new file mode 100644
index 0000000..e44b5bb
--- /dev/null
+++ b/tests/test_cdsl.py
@@ -0,0 +1,106 @@
+"""End-to-end tests for CDSL CAS statements.
+
+Single password-protected fixture (`CDSL_CAS_FILE_1` + `CDSL_CAS_PASSWORD`).
+The statement carries a CDSL demat account, an NSDL demat account
+(yes, CDSL CAS files can contain NSDL accounts as cross-references),
+and a Mutual Fund Folios pseudo-account.
+"""
+
+from __future__ import annotations
+
+import json
+
+from click.testing import CliRunner
+
+from ._assertions import (
+    assert_account_balance_closes,
+    assert_demat_account_well_formed,
+    assert_equity_well_formed,
+    assert_mutual_fund_well_formed,
+)
+
+EXPECTED_ACCOUNTS = 3
+
+EXPECTED_PER_ACCOUNT = [
+    # (type, equities, mutual_funds, bonds)
+    ("CDSL Demat Account", 25, 1, 0),
+    ("NSDL Demat Account", 2, 0, 0),
+    ("Mutual Fund Folios", 0, 16, 0),
+]
+
+PERIOD_FROM = "01-Apr-2025"
+PERIOD_TO = "31-Mar-2026"
+
+
+class TestCDSLStatement:
+    def test_file_type_and_period(self, cdsl_data):
+        assert cdsl_data.file_type == "CDSL"
+        assert cdsl_data.statement_period.from_ == PERIOD_FROM
+        assert cdsl_data.statement_period.to == PERIOD_TO
+
+    def test_account_count(self, cdsl_data):
+        assert len(cdsl_data.accounts) == EXPECTED_ACCOUNTS
+
+    def test_per_account_holdings_counts(self, cdsl_data):
+        """Account i has the type and holdings counts of EXPECTED_PER_ACCOUNT[i]."""
+        for i, (exp_type, n_eq, n_mf, n_bd) in enumerate(EXPECTED_PER_ACCOUNT):
+            ac = cdsl_data.accounts[i]
+            # Accounts are matched by position, so ordering is part of the contract.
+            where = f"acc {i} ({exp_type})"
+            assert ac.type == exp_type, f"acc {i}: type {ac.type!r}"
+            got_eq, got_mf, got_bd = len(ac.equities), len(ac.mutual_funds), len(ac.bonds)
+            assert got_eq == n_eq, f"{where}: expected {n_eq} equities, got {got_eq}"
+            assert got_mf == n_mf, f"{where}: expected {n_mf} MFs, got {got_mf}"
+            assert got_bd == n_bd, f"{where}: expected {n_bd} bonds, got {got_bd}"
+
+    def test_investor_name_set(self, cdsl_data):
+        assert cdsl_data.investor_info.name
+
+
+class TestCDSLAccountInvariants:
+    def test_account_well_formed(self, cdsl_data):
+        for ac in cdsl_data.accounts:
+            assert_demat_account_well_formed(ac)
+
+    def test_account_balance_closes(self, cdsl_data):
+        """Σ(equity.value) + Σ(mf.value) ≈ account.balance."""
+        for ac in cdsl_data.accounts:
+            assert_account_balance_closes(ac)
+
+    def test_equity_rows_well_formed(self, cdsl_data):
+        for ac in cdsl_data.accounts:
+            for eq in ac.equities:
+                assert_equity_well_formed(eq)
+
+    def test_mutual_fund_rows_well_formed(self, cdsl_data):
+        for ac in cdsl_data.accounts:
+            for mf in ac.mutual_funds:
+                assert_mutual_fund_well_formed(mf)
+
+
+class TestCDSLOutput:
+    """CDSL JSON output preserves the account schema."""
+
+    def test_json_output(self, cdsl_file, cdsl_password):
+        from casparser import read_cas_pdf
+
+        raw = read_cas_pdf(cdsl_file, cdsl_password, output="json")
+        data = json.loads(raw)
+        assert data["file_type"] == "CDSL"
+        assert len(data["accounts"]) == EXPECTED_ACCOUNTS
+        assert data["investor_info"]["name"]
+
+
+class TestCDSLCLI:
+    """CLI smoke test against the CDSL fixture."""
+
+    def test_cli_renders_table(self, cdsl_file, cdsl_password):
+        """With `-a` and no `-o`, the CLI exits 0 and prints the period line and `CDSL`."""
+        from casparser.cli import cli
+        from tests.conftest import strip_ansi
+
+        result = CliRunner().invoke(cli, [cdsl_file, "-p", cdsl_password, "-a"])
+        assert result.exit_code == 0, result.output
+        clean = strip_ansi(result.output)
+        assert "Statement Period :" in clean
+        assert "CDSL" in clean
diff --git a/tests/test_demat_units.py b/tests/test_demat_units.py
new file mode 100644
index 0000000..803b746
--- /dev/null
+++ b/tests/test_demat_units.py
@@ -0,0 +1,654 @@
+"""Unit tests for NSDL/CDSL parser helpers — exercise the corner-case
+branches that the end-to-end NSDL+CDSL fixtures don't hit (decimal
+parsing edge cases, joint-name owner block, summary-table row
+recognisers, MF holdings row anomaly handling, etc.)."""
+
+from __future__ import annotations
+
+from decimal import Decimal
+
+import pytest
+
+import casparser.parsers.cdsl as cdsl_p
+import casparser.parsers.nsdl as nsdl_p
+from casparser.parsers.pageobj import Atom, Block, Cell
+
+
+def _cell(
+    text: str, x_left: float = 0.0, x_right: float = 10.0, y_top: float = 0.0, y_bot: float = 0.0
+) -> Cell:
+    """Construct a `Cell` with one synthetic atom backing it."""
+    a = Atom(x_left, x_right, y_top, y_bot, text, "Helvetica", stream_seq=0)
+    return Cell(
+        x_left=x_left,
+        x_right=x_right,
+        y_top=y_top,
+        y_bot=y_bot,
+        text=text,
+        atoms=[a],
+    )
+
+
+def _block(*cells: Cell, page: int = 8) -> Block:
+    return Block(page=page, cells=list(cells))
+
+
+# ---------------------------------------------------------------- decimals
+
+
+class TestDecimalHelpers:
+    """Exercises NSDL + CDSL `_to_decimal` / `_opt_decimal` edge cases.
+    Both modules carry a copy of the helpers; we test both to make sure
+    the branches in each file are hit."""
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    def test_to_decimal_handles_none(self, mod):
+        assert mod._to_decimal(None) == Decimal(0)
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    @pytest.mark.parametrize("placeholder", ["", " ", "-", "--", "N.A", "NA"])
+    def test_to_decimal_handles_placeholders(self, mod, placeholder):
+        assert mod._to_decimal(placeholder) == Decimal(0)
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    def test_to_decimal_strips_commas(self, mod):
+        assert mod._to_decimal("1,23,456.78") == Decimal("123456.78")
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    def test_to_decimal_swallows_invalid(self, mod):
+        # An unparseable string falls back to 0 rather than raising.
+        assert mod._to_decimal("not a number") == Decimal(0)
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    def test_opt_decimal_returns_none_on_placeholders(self, mod):
+        """Absent, placeholder and unparseable inputs all come back as None."""
+        # Checked in the original order: None, dash placeholder, empty, junk.
+        for raw in (None, "--", "", "garbage!"):
+            assert mod._opt_decimal(raw) is None
+
+    @pytest.mark.parametrize("mod", [nsdl_p, cdsl_p])
+    def test_opt_decimal_parses_value(self, mod):
+        assert mod._opt_decimal("1,234.5") == Decimal("1234.5")
+
+
+# ---------------------------------------------------------------- CDSL
+
+
+class TestCDSLHelpers:
+    def test_split_bo_id_cdsl(self):
+        # All-digit BO ID → CDSL; first 8 = DP, last 8 = client.
+        assert cdsl_p._split_bo_id("1111222233334444") == (
+            "CDSL",
+            "11112222",
+            "33334444",
+        )
+
+    def test_split_bo_id_nsdl(self):
+        # NSDL DP IDs start with `IN`.
+        assert cdsl_p._split_bo_id("IN12345699998888") == (
+            "NSDL",
+            "IN123456",
+            "99998888",
+        )
+
+    def test_split_bo_id_invalid_length(self):
+        assert cdsl_p._split_bo_id("12345") == ("", "", "")
+
+    def test_split_bo_id_unrecognised(self):
+        # Doesn't start with IN and isn't all digits → can't classify.
+        assert cdsl_p._split_bo_id("ABCD123412341234") == ("", "", "")
+
+    def test_account_key_normalises(self):
+        assert cdsl_p._account_key("cdsl", " 11112222 ", "33334444 ") == (
+            "CDSL",
+            "11112222",
+            "33334444",
+        )
+
+    def test_full_type_format(self):
+        assert cdsl_p._full_type("cdsl") == "CDSL Demat Account"
+
+    def test_looks_numeric(self):
+        assert cdsl_p._looks_numeric("1,234.5")
+        assert cdsl_p._looks_numeric("-100")
+        assert not cdsl_p._looks_numeric("ARN-0005")
+        assert not cdsl_p._looks_numeric("DIRECT")
+        assert not cdsl_p._looks_numeric("")
+
+    def test_is_total_row(self):
+        block = _block(_cell("Sub Total"), _cell("100.00"))
+        assert cdsl_p._is_total_row(block)
+        block2 = _block(_cell("INE000A01001"), _cell("100"))
+        assert not cdsl_p._is_total_row(block2)
+
+    def test_is_holdings_header(self):
+        # A column-header row mentioning ISIN + Security keywords but
+        # NOT carrying an actual ISIN value.
+        block = _block(
+            _cell("ISIN"),
+            _cell("Security"),
+            _cell("Current Bal"),
+            _cell("Market Price"),
+        )
+        assert cdsl_p._is_holdings_header(block)
+        # A data row IS NOT a header.
+        data_row = _block(_cell("INE000A01001"), _cell("EXAMPLE COMPANY LIMITED"))
+        assert not cdsl_p._is_holdings_header(data_row)
+
+    def test_parse_holdings_row_rejects_no_isin(self):
+        block = _block(_cell("Not an ISIN"), _cell("name"), _cell("100"))
+        assert cdsl_p._parse_holdings_row(block) is None
+
+    def test_parse_holdings_row_skips_at_marker(self):
+        """The leading `@` marker (suspended issue) sits between ISIN
+        and name and should be skipped."""
+        block = _block(
+            _cell("INE000A01001", 20, 60),
+            _cell("@", 80, 85),
+            _cell("EXAMPLE COMPANY LIMITED", 90, 200),
+            _cell("100", 240, 270),
+            _cell("--", 300, 320),
+            _cell("--", 340, 360),
+            _cell("--", 380, 400),
+            _cell("100", 440, 460),
+            _cell("450.50", 500, 540),
+            _cell("45050.00", 560, 620),
+        )
+        row = cdsl_p._parse_holdings_row(block)
+        assert row is not None
+        isin, name, shares, price, value = row
+        assert isin == "INE000A01001"
+        assert name == "EXAMPLE COMPANY LIMITED"
+        assert shares == Decimal("100")
+        assert price == Decimal("450.50")
+        assert value == Decimal("45050.00")
+
+    def test_parse_holdings_row_all_dashes(self):
+        """Rights-entitlement rows with all-`--` balances should still
+        parse — the `data_start` finder accepts `--` as the first data
+        cell."""
+        block = _block(
+            _cell("INE000A01002", 20, 60),
+            _cell("EXAMPLE RIGHTS ENTITL", 80, 200),
+            _cell("--", 240, 260),
+            _cell("--", 300, 320),
+            _cell("--", 340, 360),
+            _cell("--", 380, 400),
+            _cell("--", 440, 460),
+            _cell("6.29", 500, 540),
+            _cell("0.00", 560, 620),
+        )
+        row = cdsl_p._parse_holdings_row(block)
+        assert row is not None
+        _, _, shares, price, value = row
+        assert shares == Decimal(0)
+        assert price == Decimal("6.29")
+        assert value == Decimal(0)
+
+    def test_parse_holdings_row_returns_none_on_short_block(self):
+        block = _block(_cell("INE000A01001"), _cell("name"), _cell("100"))
+        # 3 cells in all (ISIN, name, one number): too few for the 3 trailing data cells required.
+        assert cdsl_p._parse_holdings_row(block) is None
+
+
+# ---------------------------------------------------------------- NSDL
+
+
+class TestNSDLHelpers:
+    def test_full_type_format(self):
+        assert nsdl_p._full_type("cdsl") == "CDSL Demat Account"
+        assert nsdl_p._full_type("nsdl") == "NSDL Demat Account"
+
+    def test_account_key_normalises(self):
+        assert nsdl_p._account_key("nsdl", " IN301151 ", " 12241815 ") == (
+            "NSDL",
+            "IN301151",
+            "12241815",
+        )
+
+    def test_is_total_row(self):
+        assert nsdl_p._is_total_row(_block(_cell("Sub Total"), _cell("100")))
+        assert nsdl_p._is_total_row(_block(_cell("Grand Total"), _cell("1,00,000")))
+        assert not nsdl_p._is_total_row(_block(_cell("INE000A01001")))
+
+    def test_section_marker_kind(self):
+        assert nsdl_p._section_marker_kind(_block(_cell("Equity Shares"))) == "equities"
+        assert nsdl_p._section_marker_kind(_block(_cell("Mutual Funds (M)"))) == "mfunds"
+        assert nsdl_p._section_marker_kind(_block(_cell("Corporate Bonds (C)"))) == "bonds"
+        # Unsupported markers are still recognised so we don't misroute
+        # the next data row into the previous section.
+        assert nsdl_p._section_marker_kind(_block(_cell("Preference Shares (P)"))) == "unsupported"
+        # A multi-cell row is not a marker.
+        assert (
+            nsdl_p._section_marker_kind(_block(_cell("Equity Shares"), _cell("A"), _cell("B")))
+            is None
+        )
+        # An unknown short label is not a marker.
+        assert nsdl_p._section_marker_kind(_block(_cell("Random Caption"))) is None
+
+    def test_detect_mode_from_header(self):
+        # MF Holdings table
+        mfh = _block(
+            _cell("ISIN"),
+            _cell("ISIN Description"),
+            _cell("Folio No."),
+            _cell("No. of Units"),
+            _cell("Average"),
+            _cell("Total Cost"),
+        )
+        assert nsdl_p._detect_mode_from_header(mfh) == "mf_holdings"
+        # Detailed equity table without a section hint -> equities_detailed.
+        eq_det = _block(
+            _cell("ISIN"),
+            _cell("Security"),
+            _cell("Current Bal"),
+            _cell("Market Price"),
+            _cell("Value in"),
+        )
+        assert nsdl_p._detect_mode_from_header(eq_det) == "equities_detailed"
+        # ... but the same header in a 'bonds' context routes to bonds_detailed,
+        # and in an 'mfunds' context to mfunds_detailed.
+        assert nsdl_p._detect_mode_from_header(eq_det, "bonds") == "bonds_detailed"
+        assert nsdl_p._detect_mode_from_header(eq_det, "mfunds") == "mfunds_detailed"
+        # Summary bonds table.
+        bd_sum = _block(
+            _cell("ISIN"),
+            _cell("Company Name"),
+            _cell("Coupon Rate"),
+            _cell("Frequency"),
+            _cell("Maturity Date"),
+            _cell("Face Value"),
+        )
+        assert nsdl_p._detect_mode_from_header(bd_sum) == "bonds_summary"
+        # Summary equity table
+        eq_sum = _block(
+            _cell("Stock Symbol"),
+            _cell("ISIN"),
+            _cell("Company Name"),
+        )
+        assert nsdl_p._detect_mode_from_header(eq_sum) == "equities_summary"
+        # Summary MF table
+        mf_sum = _block(
+            _cell("ISIN"),
+            _cell("ISIN Description"),
+            _cell("NAV"),
+        )
+        assert nsdl_p._detect_mode_from_header(mf_sum) == "mfunds_summary"
+        # A data row (carrying a real ISIN) is NOT a header.
+        data_row = _block(_cell("INE000A01001"), _cell("Some Stock"))
+        assert nsdl_p._detect_mode_from_header(data_row) is None
+        # A truly unrecognised row returns None.
+        unknown = _block(_cell("Foo"), _cell("Bar"))
+        assert nsdl_p._detect_mode_from_header(unknown) is None
+
+    def test_is_table_header(self):
+        """`_is_table_header` accepts a keyword-only row and rejects an ISIN row."""
+        # Single cell carrying several column captions and no ISIN value.
+        header_text = (
+            "ISIN Description    No. of\nUnits    Stock Symbol    Market Price    Value in"
+        )
+        header_row = _block(_cell(header_text))
+        assert nsdl_p._is_table_header(header_row)
+        # Same single-cell shape, but the text starts with an ISIN value.
+        isin_row = _block(_cell("INE000A01001 some stock"))
+        assert not nsdl_p._is_table_header(isin_row)
+
+    def test_parse_equity_row_summary_format(self):
+        """Summary equity row: ISIN, name, face_value, num_shares,
+        price, value. We take the last three numerics."""
+        block = _block(
+            _cell("INE000A01001\nEXAMPLECO.NSE"),
+            _cell("EXAMPLE COMPANY LIMITED"),
+            _cell("1.00"),  # face value
+            _cell("100"),  # num_shares
+            _cell("450.50"),  # price
+            _cell("45,050.00"),  # value
+        )
+        eq = nsdl_p._parse_equity_row(block, detailed=False)
+        assert eq is not None
+        assert eq.isin == "INE000A01001"
+        assert eq.num_shares == Decimal("100")
+        assert eq.price == Decimal("450.50")
+        assert eq.value == Decimal("45050.00")
+
+    def test_parse_equity_row_detailed_format(self):
+        """Detailed equity row: 11 numerics; num_shares = first."""
+        block = _block(
+            _cell("INE000A01001"),
+            _cell("EXAMPLE COMPANY LIMITED"),
+            _cell("100"),  # current_bal = num_shares
+            _cell("100"),  # free_bal
+            _cell("0"),
+            _cell("0"),
+            _cell("0"),
+            _cell("0"),
+            _cell("0"),
+            _cell("0"),
+            _cell("0"),
+            _cell("450.50"),  # market_price
+            _cell("45,050.00"),  # value
+        )
+        eq = nsdl_p._parse_equity_row(block, detailed=True)
+        assert eq is not None
+        assert eq.num_shares == Decimal("100")
+        assert eq.price == Decimal("450.50")
+        assert eq.value == Decimal("45050.00")
+
+    def test_parse_equity_row_rejects_no_isin(self):
+        block = _block(_cell("not-an-isin"), _cell("name"), _cell("1"), _cell("2"), _cell("3"))
+        assert nsdl_p._parse_equity_row(block) is None
+
+    def test_parse_equity_row_rejects_too_few_numerics(self):
+        block = _block(_cell("INE000A01001"), _cell("name"), _cell("1"), _cell("2"))
+        assert nsdl_p._parse_equity_row(block) is None
+
+    def test_parse_summary_mf_row(self):
+        block = _block(
+            _cell("INF000A01002"),
+            _cell("NIPPON INDIA ETF LIQUID BeES"),
+            _cell("100.001"),  # units
+            _cell("1000.00"),  # NAV
+            _cell("100,000.00"),  # value
+        )
+        mf = nsdl_p._parse_summary_mf_row(block)
+        assert mf is not None
+        assert mf.isin == "INF000A01002"
+        assert mf.balance == Decimal("100.001")
+        assert mf.value == Decimal("100000.00")
+
+    def test_parse_summary_mf_row_rejects_non_isin(self):
+        block = _block(_cell("not-an-isin"), _cell("name"))
+        assert nsdl_p._parse_summary_mf_row(block) is None
+
+    def test_parse_mf_holdings_row_with_misplaced_ucc(self):
+        """In the NSDL MF Holdings table the UCC is sometimes rendered
+        as a lone digit (`8`) sitting at the x-position of the units
+        column. That digit must end up in `ucc`, not among the numerics."""
+        layout = [
+            ("INF000A01003\nNOT AVAILABLE", 20.0, 75.0),
+            ("ICICI Prudential\nCorporate Bond", 80.0, 145.0),
+            ("26777337", 167.0, 198.0),
+            ("89,935.20", 204.0, 235.0),
+            ("8", 231.9, 235.2),  # misplaced UCC
+            ("27.7978", 280.0, 305.0),
+            ("25,00,000.00", 320.0, 360.0),
+            ("29.3146", 393.0, 418.0),
+            ("26,36,414.65", 433.0, 473.0),
+            ("1,36,414.65", 486.0, 522.0),
+            ("8.61", 561.0, 574.0),
+        ]
+        parsed = nsdl_p._parse_mf_holdings_row(_block(*(_cell(*spec) for spec in layout)))
+        assert parsed is not None
+        assert parsed.isin == "INF000A01003"
+        assert parsed.folio == "26777337"
+        assert parsed.balance == Decimal("89935.20")
+        # The ISIN cell's UCC line is only the `NOT AVAILABLE`
+        # placeholder, so the stray `8` is what gets reported as UCC.
+        assert parsed.ucc == "8"
+
+    def test_parse_mf_holdings_row_rejects_no_isin(self):
+        lone_cell = _cell("not-an-isin", 20.0, 75.0)  # its text is not an ISIN
+        assert nsdl_p._parse_mf_holdings_row(_block(lone_cell)) is None
+
+    def test_parsers_reject_empty_block(self):
+        """A Block without any cells makes each row parser return None."""
+        no_cells = _block()
+        nsdl_rows = (nsdl_p._parse_equity_row, nsdl_p._parse_summary_mf_row)
+        for parse_row in (*nsdl_rows, nsdl_p._parse_mf_holdings_row, cdsl_p._parse_holdings_row):
+            assert parse_row(no_cells) is None
+        # The CDSL MF parser takes a second argument; an empty dict is passed here.
+        assert cdsl_p._parse_mf_holdings_row(no_cells, {}) is None
+
+    def test_parse_summary_mf_row_too_few_numerics(self):
+        """The summary MF parser needs at least three numeric cells
+        after the ISIN and scheme name; a row with only two is
+        rejected."""
+        # ISIN, scheme name, and just two numerics.
+        texts = ("INF000A01002", "Some Fund", "1", "2")
+        short_row = _block(*(_cell(text) for text in texts))
+        assert nsdl_p._parse_summary_mf_row(short_row) is None
+
+    def test_find_period_returns_none(self):
+        """`_find_period` yields None when no block's text holds a period."""
+        unrelated = [_block(_cell("nothing about a period here"))]
+        for module in (nsdl_p, cdsl_p):
+            assert module._find_period(unrelated) is None
+
+    def test_looks_numeric_handles_empty(self):
+        """`_looks_numeric` must say False for empty and for
+        whitespace-only text — the early-out branch, exercised in
+        both the NSDL and the CDSL module."""
+        for module in (nsdl_p, cdsl_p):
+            for blank in ("", "   "):
+                assert not module._looks_numeric(blank)
+
+    def test_per_account_header_joint_form(self):
+        """Joint-account section header in an NSDL statement.
+
+        It arrives split across THREE blocks: `NSDL Demat Account /
+        ACCOUNT HOLDERS`, then broker + first owner, then `DP ID:…
+        Client ID:…` + second owner. The look-ahead inside
+        `_try_per_account_header` should fold them into one account key."""
+        title_block = _block(
+            _cell("NSDL Demat Account"),
+            _cell("ACCOUNT HOLDERS"),
+            page=11,
+        )
+        first_owner_block = _block(
+            _cell("ACME BROKER LIMITED"),
+            _cell("Holder One (PAN:ABCDE1234F)"),
+            page=11,
+        )
+        second_owner_block = _block(
+            _cell("DP ID: IN123456 Client ID: 99998888"),
+            _cell("Holder Two (PAN:GHIJK5678L)"),
+            page=11,
+        )
+        sequence = [title_block, first_owner_block, second_owner_block]
+        key, consumed = nsdl_p._try_per_account_header(sequence, 0)
+        assert key == ("NSDL", "IN123456", "99998888")
+        # The title block plus both look-ahead rows count as consumed.
+        assert consumed == 3
+
+    def test_per_account_header_no_dpc_no_match(self):
+        """No DP/Client info in the `NSDL Demat Account` block or in
+        the blocks right after it → the helper reports no key (None)."""
+        page_blocks = [
+            _block(_cell(text), page=11)
+            for text in ("NSDL Demat Account", "Random unrelated text", "Another random line")
+        ]
+        key, consumed = nsdl_p._try_per_account_header(page_blocks, 0)
+        # No key is produced, and `consumed` is reported as 1.
+        assert key is None
+        assert consumed == 1
+
+    def test_per_account_header_not_demat(self):
+        """Text without any `NSDL|CDSL Demat Account` mention is not
+        treated as a section header."""
+        lone_block = _block(_cell("Just some text"), page=3)
+        key, consumed = nsdl_p._try_per_account_header([lone_block], 0)
+        assert key is None
+        assert consumed == 1
+
+    def test_summary_demat_row_4_cell(self):
+        """Page-2 summary row with broker + DP/Client joined by a newline (4 cells)."""
+        broker_and_ids = "ACME BROKER LIMITED\nDP ID: IN123456 Client ID: 99998888"
+        row = _block(
+            _cell("NSDL Demat Account"),
+            _cell(broker_and_ids),
+            _cell("12"),  # folio count
+            _cell("1,04,00,929.50"),  # balance
+            page=2,
+        )
+        assert nsdl_p._is_summary_demat_row(row)
+        account, key = nsdl_p._account_from_summary_row(row, owners=[])
+        assert key == ("NSDL", "IN123456", "99998888")
+        assert account.name == "ACME BROKER LIMITED"
+        assert account.dp_id == "IN123456"
+        assert account.client_id == "99998888"
+        assert account.folios == 12
+        assert account.balance == Decimal("10400929.50")
+
+    def test_summary_demat_row_5_cell(self):
+        """Five-cell variant, seen on CDSL rows in some NSDL CAS layouts:
+        the broker name and the DP/Client line are separate cells."""
+        texts = (
+            "CDSL Demat Account",
+            "BETA BROKER LIMITED",
+            "DP ID:11112222 Client ID:33334444",
+            "25",
+            "97,34,823.11",
+        )
+        row = _block(*(_cell(text) for text in texts), page=2)
+        assert nsdl_p._is_summary_demat_row(row)
+        account, key = nsdl_p._account_from_summary_row(row, owners=[])
+        assert key == ("CDSL", "11112222", "33334444")
+        assert account.name == "BETA BROKER LIMITED"
+        assert account.folios == 25
+        assert account.balance == Decimal("9734823.11")
+
+    def test_summary_demat_row_rejects_wrong_cell_count(self):
+        """A summary row with only three cells is too short to qualify."""
+        texts = (
+            "NSDL Demat Account",
+            "BROKER\nDP ID: IN123456 Client ID: 99998888",
+            "12",
+        )
+        truncated = _block(*(_cell(text) for text in texts), page=2)
+        assert not nsdl_p._is_summary_demat_row(truncated)
+
+    def test_parse_bond_summary_row(self):
+        """Summary-form bond row as NSDL renders it: frequency (text)
+        and coupon rate (numeric) share an x-band and must be told apart."""
+        layout = [
+            ("INE000A07001", 20.7, 67.1),
+            ("EXAMPLE BOND\nISSUER\nLIMITED", 93.2, 168.2),
+            ("Once a year", 185.8, 223.7),  # frequency text
+            ("8.10", 198.0, 211.0),  # coupon rate numeric
+            ("05-Mar-2022", 250.9, 290.3),
+            ("200", 354.3, 365.4),
+            ("1,000.00", 442.6, 468.7),
+            ("2,00,000.00", 538.2, 574.7),
+        ]
+        bond = nsdl_p._parse_bond_summary_row(_block(*(_cell(*spec) for spec in layout)))
+        assert bond is not None
+        assert bond.isin == "INE000A07001"
+        assert bond.name == "EXAMPLE BOND ISSUER LIMITED"
+        assert bond.coupon_rate == Decimal("8.10")
+        assert bond.coupon_frequency == "Once a year"
+        assert bond.maturity_date == "05-Mar-2022"
+        assert bond.num_bonds == Decimal("200")
+        assert bond.face_value == Decimal("1000.00")
+        assert bond.value == Decimal("200000.00")
+        # Fields that only the detailed form provides remain None.
+        assert bond.market_price is None
+
+    def test_parse_bond_summary_row_rejects_non_isin(self):
+        row = _block(*(_cell(t) for t in ("Not an ISIN", "...")))  # first cell is no ISIN
+        assert nsdl_p._parse_bond_summary_row(row) is None
+
+    def test_parse_bond_summary_row_rejects_empty(self):
+        no_cells = _block()  # a Block built without a single cell
+        assert nsdl_p._parse_bond_summary_row(no_cells) is None
+
+    def test_parse_bond_detailed_row(self):
+        """Detailed-form bond row, CDSL flavour: thirteen cells in all."""
+        texts = [
+            "INE000A07002",
+            "EXAMPLE BOND ISSUER LIMITED 8.71% NCD",
+            "100.000",
+            "100.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "1,276.47",
+            "1,27,647.00",
+        ]
+        bond = nsdl_p._parse_bond_detailed_row(_block(*(_cell(text) for text in texts)))
+        assert bond is not None
+        assert bond.isin == "INE000A07002"
+        assert bond.num_bonds == Decimal("100.000")
+        assert bond.market_price == Decimal("1276.47")
+        assert bond.value == Decimal("127647.00")
+        # Fields that only the summary form provides remain None.
+        assert bond.coupon_rate is None
+        assert bond.face_value is None
+        assert bond.maturity_date is None
+
+    def test_parse_bond_detailed_row_rejects_non_isin(self):
+        row = _block(*(_cell(t) for t in ("Subtotal", "...")))  # first cell is no ISIN
+        assert nsdl_p._parse_bond_detailed_row(row) is None
+
+    def test_parse_detailed_mf_row(self):
+        """Detailed 'Mutual Funds (M)' row, CDSL flavour, with an INF ISIN."""
+        texts = [
+            "INF000A01001",
+            "EXAMPLE FUND HOUSE",
+            "22,994.003",
+            "22,994.003",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "0.000",
+            "22.55",
+            "5,18,399.80",
+        ]
+        holding = nsdl_p._parse_detailed_mf_row(_block(*(_cell(text) for text in texts)))
+        assert holding is not None
+        assert holding.isin == "INF000A01001"
+        assert holding.balance == Decimal("22994.003")
+        assert holding.nav == Decimal("22.55")
+        assert holding.value == Decimal("518399.80")
+
+    def test_parse_detailed_mf_row_rejects_equity_isin(self):
+        """The detailed MF parser must not match equity rows.
+
+        A row that leads with an equity ISIN (`INE…`) must yield None."""
+        isin_cell = _cell("INE000A07002")
+        name_cell = _cell("Some equity")
+        numeric_cells = [_cell(text) for text in ("100", "1000", "100000")]
+        equity_row = _block(isin_cell, name_cell, *numeric_cells)
+        parsed = nsdl_p._parse_detailed_mf_row(equity_row)
+        assert parsed is None
+
+
+class TestISINSearchFallback:
+    """Direct-ISIN fallback of `isin_search`.
+
+    It kicks in when the primary (scheme, rta, rta_code) lookup misses but
+    the caller supplied an inline ISIN parsed from the scheme header."""
+
+    def test_direct_isin_fallback(self):
+        """Junk rta / rta_code plus a genuine ISIN hint: the fallback
+        path still resolves the scheme."""
+        from casparser.parsers._isin import isin_search
+
+        junk_keys = ("scheme name doesn't matter", "BAD_RTA", "bogus_code")
+        resolved_isin, amfi_code, kind = isin_search(*junk_keys, isin="INF846K01EW2")
+
+        assert resolved_isin == "INF846K01EW2"
+        assert amfi_code == "120503"
+        assert kind == "EQUITY"
+
+    def test_direct_isin_fallback_unknown_isin(self):
+        """If the hinted ISIN is unknown and the other lookup keys are
+        junk as well, every element of the result is None."""
+        from casparser.parsers._isin import isin_search
+
+        resolved_isin, amfi_code, kind = isin_search(
+            "",
+            "BAD",
+            "bogus",
+            isin="INF000X00X00",
+        )
+        # Nothing matched anywhere, so all three come back as None.
+        assert resolved_isin is None
+        assert amfi_code is None
+        assert kind is None
diff --git a/tests/test_errors.py b/tests/test_errors.py
new file mode 100644
index 0000000..daf2c6b
--- /dev/null
+++ b/tests/test_errors.py
@@ -0,0 +1,72 @@
+"""Error-path and back-compat tests.
+
+Covers:
+  * Incorrect password → `IncorrectPasswordError`
+  * Non-PDF / corrupt input → `CASParseError`
+  * Unrecognised CAS issuer → `CASParseError`
+  * Deprecated `force_pdfminer=True` kwarg still parses (DeprecationWarning)
+"""
+
+from __future__ import annotations
+
+import io
+import warnings
+
+import pytest
+
+from casparser import read_cas_pdf
+from casparser.exceptions import CASParseError, IncorrectPasswordError
+
+
+class TestPasswordErrors:
+    def test_incorrect_password_raises(self, cams_file):
+        # An empty password against the CAMS sample must be refused with this message.
+        with pytest.raises(IncorrectPasswordError, match="Incorrect PDF password!"):
+            read_cas_pdf(cams_file, "")
+
+
+class TestInputValidation:
+    def test_non_pdf_buffer_raises_cas_parse_error(self):
+        with io.BytesIO(b"this is not a pdf") as junk, pytest.raises(CASParseError) as caught:
+            read_cas_pdf(junk, "")
+        message = str(caught.value)
+        assert any(hint in message for hint in ("Unhandled error while opening", "Could not"))
+
+    def test_non_pdf_typeerror_wraps_as_cas_parse_error(self):
+        """A wrong-type input (an int here) must come out as
+        `CASParseError` rather than as a bare `TypeError`."""
+        with pytest.raises(CASParseError):
+            read_cas_pdf(1, "")
+
+    def test_unknown_issuer_pdf_raises(self, tmp_path):
+        """A well-formed PDF that carries no CAS marker should fail
+        cleanly at issuer detection."""
+        import pypdfium2 as pdfium
+
+        blank_pdf = tmp_path / "blank.pdf"
+        # A single empty 595 × 842 page, no text at all.
+        document = pdfium.PdfDocument.new()
+        document.new_page(595, 842)
+        document.save(str(blank_pdf))
+        with pytest.raises(CASParseError, match="Could not identify"):
+            read_cas_pdf(str(blank_pdf), "")
+
+
+class TestBackCompatShims:
+    def test_force_pdfminer_deprecated(self, cams_file, cams_password):
+        """`force_pdfminer=True` stays accepted as a no-op that emits a
+        `DeprecationWarning`; dropping it would break callers that
+        carried the kwarg over from <1.0 releases."""
+        with warnings.catch_warnings(record=True) as recorded:
+            warnings.simplefilter("always")
+            data = read_cas_pdf(cams_file, cams_password, force_pdfminer=True)
+
+        def flags_kwarg(entry):
+            is_deprecation = issubclass(entry.category, DeprecationWarning)
+            return is_deprecation and "force_pdfminer" in str(entry.message)
+
+        matching = [entry for entry in recorded if flags_kwarg(entry)]
+        assert matching, "expected DeprecationWarning mentioning force_pdfminer"
+        # Back-compat: with the deprecated kwarg present, the parse
+        # still goes through and yields folios.
+        assert data.folios
diff --git a/tests/test_gains_e2e.py b/tests/test_gains_e2e.py
new file mode 100644
index 0000000..2a14e38
--- /dev/null
+++ b/tests/test_gains_e2e.py
@@ -0,0 +1,129 @@
+"""End-to-end tests for the capital-gains analysis module.
+
+Drives `CapitalGainsReport` and its CSV / 112A exports through a
+real parsed KFin DETAILED statement. The fund-level unit tests in
+`tests/test_gains.py` cover the building blocks (CII lookup, fund
+type detection, MergedTransaction, FIFOUnits internals); these
+exercise the report's public API end-to-end so the import-side and
+formatting-side paths get hit.
+"""
+
+from __future__ import annotations
+
+import os
+
+import pytest
+
+from casparser import read_cas_pdf
+from casparser.analysis import CapitalGainsReport
+from casparser.exceptions import IncompleteCASError
+
+
+@pytest.fixture(scope="module")
+def kfintech_cas():
+    """Parsed KFin sample, built once per module; skipped without its env var."""
+    sample = os.getenv("KFINTECH_CAS_FILE_NEW")
+    if sample:
+        return read_cas_pdf(sample, os.getenv("KFINTECH_CAS_PASSWORD"))
+    pytest.skip("KFINTECH_CAS_FILE_NEW not set")
+
+
+def test_capital_gains_report_basic(kfintech_cas):
+    """A parsed CASData is enough to build a CapitalGainsReport, and
+    the report exposes its documented surface."""
+    report = CapitalGainsReport(kfintech_cas)
+    # Both guards are plain booleans; calling them here gets them covered.
+    for guard in (report.has_gains, report.has_error):
+        assert isinstance(guard(), bool)
+    # Which FYs show up depends on the sample's transactions, so only
+    # the container type is checked.
+    fy_list = report.get_fy_list()
+    assert isinstance(fy_list, list)
+    # The two sums are expected to be populated even for empty datasets.
+    for total in (report.invested_amount, report.current_value):
+        assert total is not None
+
+
+def test_capital_gains_summary(kfintech_cas):
+    """`get_summary` produces the FY → totals breakdown."""
+    summary = CapitalGainsReport(kfintech_cas).get_summary()
+    # The result is an iterable of rows / strings; this is only a
+    # smoke check that the call completed and returned something.
+    assert summary is not None
+
+
+def test_capital_gains_csv_outputs(kfintech_cas):
+    """Both CSV exporters hand back a string, including for a sample
+    without any realised gains."""
+    report = CapitalGainsReport(kfintech_cas)
+    # Summary export first, then the detailed gains export.
+    exports = (report.get_summary_csv_data(), report.get_gains_csv_data())
+    for csv_text in exports:
+        assert isinstance(csv_text, str)
+
+
+def test_capital_gains_112a_report(kfintech_cas):
+    """A 112A report for a given FY can be produced even if that FY
+    has no entries at all (an empty list is returned then)."""
+    report = CapitalGainsReport(kfintech_cas)
+    available = report.get_fy_list()
+    # First FY with entries if any; else a historical FY (must not crash either).
+    if available:
+        target_fy = available[0]
+    else:
+        target_fy = "FY2020-21"
+    assert isinstance(report.generate_112a(target_fy), list)
+    assert isinstance(report.generate_112a_csv_data(target_fy), str)
+
+
+def test_incomplete_cas_raises():
+    """CapitalGainsReport must raise IncompleteCASError when some
+    folio in the CAS starts from a non-zero opening balance."""
+    cams_path = os.getenv("CAMS_CAS_FILE")
+    if not cams_path:
+        pytest.skip("CAMS_CAS_FILE not set")
+    cams_pw = os.getenv("CAMS_CAS_PASSWORD")
+    data = read_cas_pdf(cams_path, cams_pw)
+    # The CAMS sample's statement period begins mid-stream, so opening
+    # balances are non-zero and the report has to refuse to compute.
+    threshold = Decimal("0.01")
+    schemes = (scheme for folio in data.folios for scheme in folio.schemes)
+    has_open_bal = any(s.open >= threshold and s.transactions for s in schemes)
+    if not has_open_bal:
+        pytest.skip("sample doesn't have non-zero opening balance schemes")
+    with pytest.raises(IncompleteCASError):
+        CapitalGainsReport(data)
+
+
+def test_gains_cli(tmp_path):
+    """`-g --gains-112a FY2020-21` drives the whole capital-gains
+    pipeline through the CLI — the user-facing entry point that
+    composes parsing + gains analysis + CSV export."""
+    kfin = os.getenv("KFINTECH_CAS_FILE_NEW")
+    if not kfin:
+        pytest.skip("KFINTECH_CAS_FILE_NEW not set")
+    from click.testing import CliRunner
+
+    from casparser.cli import cli
+
+    out = tmp_path / "gains.csv"
+    result = CliRunner().invoke(
+        cli,
+        [
+            kfin,
+            "-p",
+            os.getenv("KFINTECH_CAS_PASSWORD", ""),  # argv entries must be str, never None
+            "-g",
+            "--gains-112a",
+            "FY2020-21",
+            "-o",
+            str(out),
+        ],
+    )
+    # 0 = success; 2 = "no gains for that FY" — both acceptable; the
+    # goal is exercising the import + analysis paths.
+    assert result.exit_code in (0, 2), f"unexpected exit {result.exit_code}: {result.output}"
+
+
+# Decimal import at file bottom keeps the e2e test module small.
+from decimal import Decimal  # noqa: E402
diff --git a/tests/test_helpers.py b/tests/test_helpers.py
new file mode 100644
index 0000000..f842474
--- /dev/null
+++ b/tests/test_helpers.py
@@ -0,0 +1,132 @@
+"""Unit tests for the small reusable helpers that survived v1.0:
+
+- `casparser.parsers._classify.get_transaction_type`
+- `casparser.parsers._classify.get_parsed_scheme_name`
+- `casparser.parsers._isin.isin_search`
+"""
+
+from decimal import Decimal
+
+from casparser.enums import TransactionType
+from casparser.parsers._classify import (
+    get_parsed_scheme_name,
+    get_transaction_type,
+)
+from casparser.parsers._isin import isin_search
+
+
+class TestTransactionType:
+    """Tests for `get_transaction_type(description, units)`.
+
+    The helper returns a `(TransactionType, rate)` pair; in the cases
+    below the rate is only set for dividend descriptions."""
+
+    def test_basic_types(self):
+        """Plain descriptions map to their type; the rate slot is None."""
+        cases = [
+            ("Redemption", Decimal("-100"), TransactionType.REDEMPTION),
+            ("Address updated", None, TransactionType.MISC),
+            ("***STT paid ***", None, TransactionType.STT_TAX),
+            ("***stamp duty***", None, TransactionType.STAMP_DUTY_TAX),
+            ("*** TDS on Above ***", None, TransactionType.TDS_TAX),
+            (
+                "Creation of units - Segregated portfolio",
+                Decimal("1"),
+                TransactionType.SEGREGATION,
+            ),
+        ]
+        for description, units, expected_type in cases:
+            assert get_transaction_type(description, units) == (expected_type, None)
+
+    def test_unknown_zero_units(self):
+        """Unrecognised text together with zero units is UNKNOWN."""
+        outcome = get_transaction_type("***Random text***", Decimal("0"))
+        assert outcome == (TransactionType.UNKNOWN, None)
+
+    def test_reversal(self):
+        """A dishonoured SIP cheque with negative units is a REVERSAL."""
+        description = "Purchase SIPCheque Dishonoured - Instalment No 108"
+        outcome = get_transaction_type(description, Decimal("-1"))
+        assert outcome == (TransactionType.REVERSAL, None)
+
+    def test_dividends(self):
+        """IDCW / dividend lines: the `@ Rs.<rate> per unit` figure is
+        returned next to the reinvest-or-payout type."""
+        reinvest = TransactionType.DIVIDEND_REINVEST
+        payout = TransactionType.DIVIDEND_PAYOUT
+        one_unit = Decimal("1")
+        assert get_transaction_type("IDCW Reinvestment @ Rs.2.00 per unit", one_unit) == (
+            reinvest,
+            Decimal("2.00"),
+        )
+        assert get_transaction_type("IDCW Reinvested @ Rs.0.0241 per unit", one_unit) == (
+            reinvest,
+            Decimal("0.0241"),
+        )
+        assert get_transaction_type("IDCW Paid @ Rs.0.06 per unit", one_unit) == (
+            payout,
+            Decimal("0.06"),
+        )
+        assert get_transaction_type("Div. Reinvested @ Rs.0.0241 per unit", one_unit) == (
+            reinvest,
+            Decimal("0.0241"),
+        )
+
+
+class TestParsedSchemeName:
+    def test_passthrough(self):
+        """A clean scheme name comes back unchanged."""
+        name = "Axis Long Term Equity Fund - Direct Growth"
+        cleaned = get_parsed_scheme_name(name)
+        assert cleaned == name
+
+    def test_trailing_whitespace(self):
+        """Trailing whitespace is trimmed."""
+        raw = "Axis Bluechip Fund - Regular Growth "
+        cleaned = get_parsed_scheme_name(raw)
+        assert cleaned == "Axis Bluechip Fund - Regular Growth"
+
+    def test_formerly_known_as_stripped(self):
+        """The `(Formerly known as …)` suffix is dropped."""
+        raw = (
+            "HSBC Corporate Bond Fund - Regular Growth "
+            "(Formerly known as L&T Triple Ace Bond Fund - Growth)"
+        )
+        cleaned = get_parsed_scheme_name(raw)
+        assert cleaned == "HSBC Corporate Bond Fund - Regular Growth"
+
+    def test_erstwhile_stripped(self):
+        """The `(erstwhile …)` suffix is dropped, `(Regular Plan)` kept."""
+        raw = (
+            "Bandhan ELSS Tax saver Fund-Growth-(Regular Plan)"
+            "(erstwhile Bandhan Tax Advantage ELSS Fund-Growth-Regular Plan)"
+        )
+        cleaned = get_parsed_scheme_name(raw)
+        assert cleaned == "Bandhan ELSS Tax saver Fund-Growth-(Regular Plan)"
+
+    def test_non_demat_stripped(self):
+        """Both the `(erstwhile …)` and the `(Non-Demat)` suffix go."""
+        raw = (
+            "Bandhan Liquid Fund-Growth-(Regular Plan) "
+            "(erstwhile IDFC Cash Fund-Growth-Regular Plan) (Non-Demat) "
+        )
+        cleaned = get_parsed_scheme_name(raw)
+        assert cleaned == "Bandhan Liquid Fund-Growth-(Regular Plan)"
+
+
+class TestISINSearch:
+    def test_kfintech_lookup(self):
+        """A known (scheme, RTA, RTA code) triple resolves to its
+        ISIN, AMFI code and scheme type."""
+        scheme = "Axis Long Term Equity Fund - Direct Growth"
+        found_isin, amfi_code, kind = isin_search(scheme, "KFINTECH", "128TSDGG")
+        assert found_isin == "INF846K01EW2"
+        assert amfi_code == "120503"
+        assert kind == "EQUITY"
+
+    def test_no_match(self):
+        """Empty scheme name and RTA code: all three results are None."""
+        found_isin, amfi_code, kind = isin_search("", "KARVY", "")
+        assert found_isin is None
+        assert amfi_code is None
+        assert kind is None
diff --git a/tests/test_kfin.py b/tests/test_kfin.py
new file mode 100644
index 0000000..b767a89
--- /dev/null
+++ b/tests/test_kfin.py
@@ -0,0 +1,145 @@
+"""End-to-end tests for KFintech CAS files.
+
+Mirrors the structure of `tests/test_cams.py`: two detailed fixtures
+(long-history `KFINTECH_CAS_FILE` + multi-decade `KFINTECH_CAS_FILE_NEW`)
+plus a summary fixture (`KFINTECH_CAS_SUMMARY`).
+"""
+
+from __future__ import annotations
+
+import json
+
+from click.testing import CliRunner
+
+from casparser.enums import CASFileType
+
+from ._assertions import (
+    assert_folio_well_formed,
+    assert_investor_info_complete,
+    assert_scheme_transaction_units_close,
+    assert_scheme_valuation_arithmetic,
+    assert_scheme_well_formed,
+)
+
+# Pinned fixture shapes: folio / scheme counts (plus the period for DETAILED).
+DETAILED = dict(
+    main=dict(folios=17, schemes=30, period_from="01-Jan-1990", period_to="31-Mar-2021"),
+    new=dict(folios=14, schemes=30, period_from="01-Jan-2000", period_to="03-Sep-2023"),
+)
+SUMMARY = {"folios": 9, "schemes": 13}
+
+
+class TestKFinDetailed:
+    """Checks on the long-history KFintech DETAILED sample (`KFINTECH_CAS_FILE`)."""
+
+    def test_shape(self, kfin_data):
+        expected = DETAILED["main"]
+        assert kfin_data.file_type == "KFINTECH"
+        assert kfin_data.cas_type == CASFileType.DETAILED.value
+        assert kfin_data.statement_period.from_ == expected["period_from"]
+        assert kfin_data.statement_period.to == expected["period_to"]
+        assert len(kfin_data.folios) == expected["folios"]
+        scheme_count = sum(len(folio.schemes) for folio in kfin_data.folios)
+        assert scheme_count == expected["schemes"]
+
+    def test_investor_info(self, kfin_data):
+        assert_investor_info_complete(kfin_data.investor_info)
+
+    def test_every_folio_well_formed(self, kfin_data):
+        for entry in kfin_data.folios:
+            assert_folio_well_formed(entry)
+
+    def test_every_scheme_well_formed(self, kfin_data):
+        schemes = (scheme for folio in kfin_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_well_formed(scheme)
+
+    def test_close_times_nav_equals_valuation(self, kfin_data):
+        schemes = (scheme for folio in kfin_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_valuation_arithmetic(scheme)
+
+    def test_open_plus_units_equals_close(self, kfin_data):
+        """Invariant: `scheme.open + Σ(txn.units) == scheme.close` holds
+        for every scheme. It became checkable once extract.py gained the
+        same-font subset-cluster dedup; before that, the KFin date overlay
+        corrupted some SIP rows and broke the sum."""
+        schemes = (scheme for folio in kfin_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_transaction_units_close(scheme)
+
+
+class TestKFinDetailedNew:
+    """Checks on the multi-decade KFintech DETAILED sample (`KFINTECH_CAS_FILE_NEW`)."""
+
+    def test_shape(self, kfin_new_data):
+        expected = DETAILED["new"]
+        assert kfin_new_data.file_type == "KFINTECH"
+        assert kfin_new_data.cas_type == CASFileType.DETAILED.value
+        assert kfin_new_data.statement_period.from_ == expected["period_from"]
+        assert kfin_new_data.statement_period.to == expected["period_to"]
+        assert len(kfin_new_data.folios) == expected["folios"]
+        scheme_count = sum(len(folio.schemes) for folio in kfin_new_data.folios)
+        assert scheme_count == expected["schemes"]
+
+    def test_every_scheme_well_formed(self, kfin_new_data):
+        schemes = (scheme for folio in kfin_new_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_well_formed(scheme)
+
+    def test_close_times_nav_equals_valuation(self, kfin_new_data):
+        schemes = (scheme for folio in kfin_new_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_valuation_arithmetic(scheme)
+
+    def test_open_plus_units_equals_close(self, kfin_new_data):
+        schemes = (scheme for folio in kfin_new_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_transaction_units_close(scheme)
+
+
+class TestKFinSummary:
+    """Checks on the KFintech SUMMARY sample (`KFINTECH_CAS_SUMMARY`)."""
+
+    def test_shape(self, kfin_summary_data):
+        # Only the folio / scheme counts are pinned for the summary sample.
+        assert kfin_summary_data.file_type == "KFINTECH"
+        assert kfin_summary_data.cas_type == CASFileType.SUMMARY.value
+        assert len(kfin_summary_data.folios) == SUMMARY["folios"]
+        scheme_count = sum(len(folio.schemes) for folio in kfin_summary_data.folios)
+        assert scheme_count == SUMMARY["schemes"]
+
+    def test_investor_info(self, kfin_summary_data):
+        assert_investor_info_complete(kfin_summary_data.investor_info)
+
+    def test_every_scheme_well_formed(self, kfin_summary_data):
+        schemes = (scheme for folio in kfin_summary_data.folios for scheme in folio.schemes)
+        for scheme in schemes:
+            assert_scheme_well_formed(scheme)
+
+
+class TestKFinCLI:
+    """Two CLI invocations only: the JSON output path and the
+    wrong-password error path. The remaining CLI semantics are
+    covered by `test_cams.py`."""
+
+    def test_json_output(self, tmp_path, kfin_file, kfin_password):
+        """Writing to a `.json` path yields a parseable KFINTECH payload."""
+        from casparser.cli import cli
+
+        destination = tmp_path / "out.json"
+        argv = [kfin_file, "-p", kfin_password, "-o", str(destination)]
+        outcome = CliRunner().invoke(cli, argv)
+        assert outcome.exit_code == 0, outcome.output
+        with destination.open() as handle:
+            payload = json.load(handle)
+        assert payload["file_type"] == "KFINTECH"
+
+    def test_wrong_password(self, kfin_file, cams_password):
+        """Feeding the CAMS password to a KFin file must fail cleanly
+        via the CLI, with the password message in its output."""
+        from casparser.cli import cli
+
+        outcome = CliRunner().invoke(cli, [kfin_file, "-p", cams_password])
+        assert outcome.exit_code != 0
+        assert "Incorrect PDF password!" in outcome.output
diff --git a/tests/test_mupdf.py b/tests/test_mupdf.py
deleted file mode 100644
index ab3df79..0000000
--- a/tests/test_mupdf.py
+++ /dev/null
@@ -1,110 +0,0 @@
-import re
-
-import fitz
-import pytest
-from click.testing import CliRunner
-
-from casparser.enums import FileType
-from casparser.exceptions import CASParseError
-
-from .base import BaseTestClass
-
-
-class TestMuPDF(BaseTestClass):
-    """Test PyMuPDF parser."""
-
-    def test_output_csv(self):
-        output = self.read_pdf(self.cams_file_name, self.cams_password, output="csv")
-        assert isinstance(output, str)
-
-    def test_cli(self, tmpdir):
-        from casparser.cli import cli
-
-        runner = CliRunner()
-
-        fpath = tmpdir.join("output.json")
-        result = runner.invoke(
-            cli, [self.cams_file_name, "-p", self.cams_password, "-o", fpath.strpath]
-        )
-        assert result.exit_code == 0
-        assert "File saved" in result.output
-
-        fpath = tmpdir.join("output.txt")
-        result = runner.invoke(
-            cli,
-            [
-                self.cams_summary_file_name,
-                "-p",
-                self.cams_password,
-                "-o",
-                fpath.strpath,
-                "-s",
-            ],
-        )
-        assert result.exit_code != 1
-        assert "File saved" in result.output
-
-        fpath = tmpdir.join("output.csv")
-        result = runner.invoke(
-            cli, [self.cams_file_name, "-p", self.cams_password, "-o", fpath.strpath]
-        )
-        assert result.exit_code != 1
-        assert "File saved" in result.output
-
-        fpath = tmpdir.join("output.csv")
-        result = runner.invoke(
-            cli,
-            [
-                self.kfintech_file_name,
-                "-p",
-                self.kfintech_password,
-                "-o",
-                fpath.strpath,
-                "-s",
-                "-g",
-                "--gains-112a",
-                "FY2020-21",
-            ],
-        )
-        assert result.exit_code != 1
-        assert "File saved" in result.output
-
-        result = runner.invoke(cli, [self.kfintech_file_name, "-p", self.kfintech_password, "-s"])
-        assert result.exit_code != 1
-
-        result = runner.invoke(cli, [self.kfintech_file_name, "-p", self.cams_password])
-        assert result.exit_code != 0
-        assert "Incorrect PDF password!" in result.output
-
-        result = runner.invoke(cli, [self.cams_file_name, "-p", self.cams_password, "-g"])
-        assert result.exit_code == 2
-        assert "CAS is incomplete!" in result.output
-
-        result = runner.invoke(cli, [self.bad_file_name, "-p", "", "-a"])
-        assert result.exit_code == 0
-        clean_output = self.ansi_cleaner.sub("", result.output)
-        assert re.search(r"Error\s+:\s+1\s+schemes", clean_output) is not None
-
-    def test_bad_investor_info(self):
-        from casparser.parsers.mupdf import parse_investor_info
-
-        with pytest.raises(CASParseError) as exc_info:
-            parse_investor_info({"width": 0, "height": 0, "blocks": []}, fitz.Rect())
-        assert "Unable to parse investor data" in str(exc_info)
-
-    def test_bad_file_type(self):
-        from casparser.parsers.mupdf import parse_file_type
-
-        file_type = parse_file_type([])
-        assert file_type == FileType.UNKNOWN
-
-    def test_nsdl_statement(self):
-        from casparser.cli import cli
-
-        runner = CliRunner()
-        result = runner.invoke(cli, [self.nsdl_file_name, "-p", "", "-a"])
-        assert result.exit_code == 0
-        clean_output = self.ansi_cleaner.sub("", result.output)
-
-        assert re.search(r"Matched\s+:\s+3\s+accounts", clean_output) is not None
-        assert re.search(r"Error\s+:\s+0\s+accounts", clean_output) is not None
diff --git a/tests/test_nsdl.py b/tests/test_nsdl.py
new file mode 100644
index 0000000..7668201
--- /dev/null
+++ b/tests/test_nsdl.py
@@ -0,0 +1,156 @@
+"""End-to-end tests for NSDL CAS statements.
+
+Single fixture (`NSDL_CAS_FILE_1`, unencrypted) carrying:
+
+  * 1 NSDL demat account (equities + summary-form bonds)
+  * 1 CDSL demat account (equities + detailed MFs + detailed bonds)
+  * 1 Mutual Fund Folios pseudo-account
+
+The shape is locked in below (counts only — rupee figures stay out
+of the repo). Arithmetic invariants from `_assertions` validate the
+parsed numerics without exposing private totals.
+"""
+
+from __future__ import annotations
+
+from click.testing import CliRunner
+
+from ._assertions import (
+    assert_account_balance_closes,
+    assert_bond_detailed_form,
+    assert_bond_summary_form,
+    assert_demat_account_well_formed,
+    assert_equity_well_formed,
+    assert_mutual_fund_well_formed,
+)
+
+# Exact NSDL fixture shape; row i is checked against `accounts[i]`, so order
+# matters. Bonds: summary-form (NSDL demat) vs detailed-form (CDSL demat).
+EXPECTED_ACCOUNTS = 3
+
+EXPECTED_PER_ACCOUNT = [
+    # (type, equities, mutual_funds, bonds_summary, bonds_detailed)
+    ("NSDL Demat Account", 5, 0, 7, 0),
+    ("CDSL Demat Account", 12, 4, 0, 9),
+    ("Mutual Fund Folios", 0, 13, 0, 0),
+]
+
+PERIOD_FROM = "01-Dec-2020"
+PERIOD_TO = "31-Dec-2020"
+
+
+class TestNSDLStatement:
+    """Statement-level shape: file type, period, and holdings counts."""
+
+    def test_file_type_and_period(self, nsdl_data):
+        # `use_enum_values=True` on the model — file_type is a str.
+        assert nsdl_data.file_type == "NSDL"
+        assert nsdl_data.statement_period.from_ == PERIOD_FROM
+        assert nsdl_data.statement_period.to == PERIOD_TO
+
+    def test_account_count(self, nsdl_data):
+        assert len(nsdl_data.accounts) == EXPECTED_ACCOUNTS
+
+    def test_per_account_holdings_counts(self, nsdl_data):
+        """Account i must match row i of `EXPECTED_PER_ACCOUNT`: type,
+        equity / MF counts, and bond counts split into summary form
+        (`face_value` set) vs detailed form (`market_price` set)."""
+        for i, (exp_type, n_eq, n_mf, n_bd_sum, n_bd_det) in enumerate(EXPECTED_PER_ACCOUNT):
+            ac = nsdl_data.accounts[i]
+            assert ac.type == exp_type, f"acc {i}: type {ac.type!r}"
+            assert len(ac.equities) == n_eq, (
+                f"acc {i} ({exp_type}): expected {n_eq} equities, got {len(ac.equities)}"
+            )
+            assert len(ac.mutual_funds) == n_mf, (
+                f"acc {i} ({exp_type}): expected {n_mf} MFs, got {len(ac.mutual_funds)}"
+            )
+            summary_bonds = sum(1 for b in ac.bonds if b.face_value is not None)
+            detailed_bonds = sum(1 for b in ac.bonds if b.market_price is not None)
+            assert len(ac.bonds) == n_bd_sum + n_bd_det, f"acc {i}: got {len(ac.bonds)} bonds"
+            assert (
+                summary_bonds == n_bd_sum
+            ), f"acc {i}: expected {n_bd_sum} summary-form bonds, got {summary_bonds}"
+            assert (
+                detailed_bonds == n_bd_det
+            ), f"acc {i}: expected {n_bd_det} detailed-form bonds, got {detailed_bonds}"
+
+    def test_investor_name_set(self, nsdl_data):
+        # NSDL/CDSL investor extractor populates `name`; mobile/email
+        # are not always reliable on NSDL CAS, so we only require name.
+        assert nsdl_data.investor_info.name
+
+
+class TestNSDLAccountInvariants:
+    """Shared `_assertions` invariants applied to every parsed account."""
+
+    def test_account_well_formed(self, nsdl_data):
+        for account in nsdl_data.accounts:
+            assert_demat_account_well_formed(account)
+
+    def test_account_balance_closes(self, nsdl_data):
+        """Per account, equity + MF + bond values must sum to
+        `account.balance`; a mismatch points at a holding row that
+        was dropped or routed to the wrong account."""
+        for account in nsdl_data.accounts:
+            assert_account_balance_closes(account)
+
+    def test_equity_rows_well_formed(self, nsdl_data):
+        equities = (eq for account in nsdl_data.accounts for eq in account.equities)
+        for equity in equities:
+            assert_equity_well_formed(equity)
+
+    def test_mutual_fund_rows_well_formed(self, nsdl_data):
+        """Every MF holding must satisfy `balance * nav ≈ value`."""
+        holdings = (mf for account in nsdl_data.accounts for mf in account.mutual_funds)
+        for holding in holdings:
+            assert_mutual_fund_well_formed(holding)
+
+
+class TestNSDLBonds:
+    """Bond-level invariants, split by whether a row is summary or detailed form."""
+
+    def test_summary_form_bonds(self, nsdl_data):
+        """Bonds carrying `face_value` (summary form, NSDL-account page):
+        full metadata, `num_bonds * face_value == value` exactly."""
+        all_bonds = [bond for account in nsdl_data.accounts for bond in account.bonds]
+        with_face_value = [bond for bond in all_bonds if bond.face_value is not None]
+        # An empty selection would make the loop below pass vacuously.
+        assert with_face_value, "no summary-form bonds found in fixture"
+        for bond in with_face_value:
+            assert_bond_summary_form(bond)
+
+    def test_detailed_form_bonds(self, nsdl_data):
+        """Bonds carrying `market_price` (detailed form, CDSL-account page):
+        only quantity + market_price + value, `num_bonds * market_price ≈ value`."""
+        all_bonds = [bond for account in nsdl_data.accounts for bond in account.bonds]
+        with_market_price = [bond for bond in all_bonds if bond.market_price is not None]
+        # An empty selection would make the loop below pass vacuously.
+        assert with_market_price, "no detailed-form bonds found in fixture"
+        for bond in with_market_price:
+            assert_bond_detailed_form(bond)
+
+    def test_every_bond_belongs_to_exactly_one_form(self, nsdl_data):
+        """Each bond row must carry exactly one of `face_value` (summary
+        form) or `market_price` (detailed form): not both, not neither."""
+        for account in nsdl_data.accounts:
+            for bond in account.bonds:
+                is_summary = bond.face_value is not None
+                is_detailed = bond.market_price is not None
+                assert is_summary != is_detailed, (
+                    f"bond {bond.isin} ambiguous: "
+                    f"face_value={bond.face_value} market_price={bond.market_price}"
+                )
+
+
+class TestNSDLCLI:
+    def test_cli_renders_table(self, nsdl_file):
+        """`casparser <nsdl_file> -p "" -a` exits 0 and prints the statement
+        header; the empty password works as this fixture is unencrypted."""
+        from casparser.cli import cli
+        from .conftest import strip_ansi  # relative, like the `._assertions` import
+
+        result = CliRunner().invoke(cli, [nsdl_file, "-p", "", "-a"])
+        assert result.exit_code == 0, result.output  # surface CLI output on failure
+        clean = strip_ansi(result.output)
+        assert "Statement Period :" in clean
+        assert "NSDL" in clean
diff --git a/tests/test_pdfminer.py b/tests/test_pdfminer.py
deleted file mode 100644
index 44ca77b..0000000
--- a/tests/test_pdfminer.py
+++ /dev/null
@@ -1,64 +0,0 @@
-import sys
-
-import pytest
-from pdfminer.layout import LTTextBoxHorizontal
-
-from casparser import read_cas_pdf
-from casparser.exceptions import CASParseError
-
-from .base import BaseTestClass
-
-try:
-    import builtins
-except ImportError:
-    import __builtin__ as builtins
-
-realimport = builtins.__import__
-
-
-def mockimport(name, *args):
-    """Force ImportError on fitz and/or mupdf import and make casparser fallback to pdfminer"""
-    if name in ("fitz", "mupdf"):
-        raise ImportError
-    return realimport(name, *args)
-
-
-@pytest.fixture(scope="class")
-def monkeyclass():
-    with pytest.MonkeyPatch.context() as mp:
-        yield mp
-
-
-@pytest.fixture(scope="class")
-def use_pdfminer(monkeyclass):
-    if "fitz" in sys.modules:
-        del sys.modules["fitz"]
-    monkeyclass.setattr(builtins, "__import__", mockimport)
-    yield
-    monkeyclass.setattr(builtins, "__import__", realimport)
-
-
-@pytest.mark.usefixtures("use_pdfminer")
-class TestPDFMiner(BaseTestClass):
-    """Test pdfminer parser."""
-
-    @classmethod
-    def setup_class(cls):
-        BaseTestClass.setup_class()
-
-    def test_bad_investor_info(self):
-        from casparser.parsers.pdfminer import parse_investor_info_mf
-
-        with pytest.raises(CASParseError) as exc_info:
-            box = LTTextBoxHorizontal()
-            box.get_text()
-            parse_investor_info_mf([], 0, 0)
-        assert "Unable to parse investor data" in str(exc_info)
-
-    def test_invalid_file_type(self):
-        with pytest.raises(CASParseError) as exc_info:
-            read_cas_pdf(1, "", force_pdfminer=True)
-        assert "Invalid input" in str(exc_info)
-
-        with pytest.raises(CASParseError) as exc_info:
-            read_cas_pdf(self.nsdl_file_name, "", force_pdfminer=True)
diff --git a/tests/test_process.py b/tests/test_process.py
deleted file mode 100644
index edc6b38..0000000
--- a/tests/test_process.py
+++ /dev/null
@@ -1,155 +0,0 @@
-from decimal import Decimal
-
-import pytest
-
-from casparser.enums import TransactionType
-from casparser.exceptions import CASParseError, HeaderParseError
-from casparser.process import process_cas_text
-from casparser.process.cas_detailed import (
-    ParsedTransaction,
-    get_parsed_scheme_name,
-    get_transaction_type,
-    parse_header,
-    parse_transaction,
-)
-from casparser.process.cas_summary import parse_header as parse_summary_header
-from casparser.process.utils import isin_search
-
-
-class TestProcessClass:
-    def test_detailed_header_parser(self):
-        good_header = "Consolidated Account Statement\n01-Apr-2018 To 31-Mar-2019"
-        bad_header = "Consolidated Account Statement\n01-Apr-2018"
-
-        header_data = parse_header(good_header)
-        assert header_data == {"from": "01-Apr-2018", "to": "31-Mar-2019"}
-
-        with pytest.raises(HeaderParseError):
-            parse_header(bad_header)
-
-    def test_summary_header_parser(self):
-        good_header = "Consolidated Account Summary\nAs On 01-Apr-2018"
-        bad_header = "Consolidated Account Summary\n01-Apr-2018"
-
-        header_data = parse_summary_header(good_header)
-        assert header_data == {"date": "01-Apr-2018"}
-
-        with pytest.raises(HeaderParseError):
-            parse_summary_header(bad_header)
-
-    def test_process_bad_cas(self):
-        with pytest.raises(CASParseError):
-            process_cas_text("")
-
-    def test_transaction_type(self):
-        assert get_transaction_type("Redemption", Decimal(-100.0)) == (
-            TransactionType.REDEMPTION,
-            None,
-        )
-        assert get_transaction_type("Address updated", None) == (TransactionType.MISC, None)
-        assert get_transaction_type("***STT paid ***", None) == (TransactionType.STT_TAX, None)
-        assert get_transaction_type("***stamp duty***", None) == (
-            TransactionType.STAMP_DUTY_TAX,
-            None,
-        )
-        assert get_transaction_type("*** TDS on Above ***", None) == (TransactionType.TDS_TAX, None)
-        assert get_transaction_type("Creation of units - Segregated portfolio", Decimal(1.0)) == (
-            TransactionType.SEGREGATION,
-            None,
-        )
-        assert get_transaction_type("***Random text***", Decimal(0.0)) == (
-            TransactionType.UNKNOWN,
-            None,
-        )
-
-        assert get_transaction_type(
-            "Purchase SIPCheque Dishonoured - Instalment No 108", Decimal(-1.0)
-        ) == (TransactionType.REVERSAL, None)
-
-        assert parse_transaction(
-            "01-Jan-2021\t\tCreation of units - Segregated Portfolio\t\t1.000\t\t12,601.184"
-        ) == ParsedTransaction(
-            date="01-Jan-2021",
-            description="Creation of units - Segregated Portfolio",
-            units="1.000",
-            balance="12,601.184",
-            nav=None,
-            amount=None,
-        )
-
-        assert parse_transaction(
-            "01-Jan-2021\t\tIDCW Reinvestment @ Rs.0.003 per unit\t\t0.32\t\t\t\t1001.40\t\t12.34"
-        ) == ParsedTransaction(
-            date="01-Jan-2021",
-            description="IDCW Reinvestment @ Rs.0.003 per unit",
-            units="0.000",
-            balance="12.34",
-            nav="1001.40",
-            amount="0.32",
-        )
-
-    def test_dividend_transactions(self):
-        assert get_transaction_type("IDCW Reinvestment @ Rs.2.00 per unit", Decimal(1.0)) == (
-            TransactionType.DIVIDEND_REINVEST,
-            Decimal("2.00"),
-        )
-        assert get_transaction_type("IDCW Reinvested @ Rs.0.0241 per unit", Decimal(1.0)) == (
-            TransactionType.DIVIDEND_REINVEST,
-            Decimal("0.0241"),
-        )
-        assert get_transaction_type("IDCW Paid @ Rs.0.06 per unit", Decimal(1.0)) == (
-            TransactionType.DIVIDEND_PAYOUT,
-            Decimal("0.06"),
-        )
-        # assert get_transaction_type("***IDCW Payout***", None) == (
-        #     TransactionType.DIVIDEND_PAYOUT,
-        #     None,
-        # )
-        assert get_transaction_type("Div. Reinvested @ Rs.0.0241 per unit", Decimal(1.0)) == (
-            TransactionType.DIVIDEND_REINVEST,
-            Decimal("0.0241"),
-        )
-
-    def test_parsed_scheme_name(self):
-        assert (
-            get_parsed_scheme_name("Axis Long Term Equity Fund - Direct Growth")
-            == "Axis Long Term Equity Fund - Direct Growth"
-        )
-        assert (
-            get_parsed_scheme_name("Axis Bluechip Fund - Regular Growth ")
-            == "Axis Bluechip Fund - Regular Growth"
-        )
-        assert (
-            get_parsed_scheme_name(
-                "HSBC Corporate Bond Fund - Regular Growth "
-                "(Formerly known as L&T Triple Ace Bond Fund - Growth)"
-            )
-            == "HSBC Corporate Bond Fund - Regular Growth"
-        )
-        assert (
-            get_parsed_scheme_name(
-                "Bandhan ELSS Tax saver Fund-Growth-(Regular Plan)"
-                "(erstwhile Bandhan Tax Advantage ELSS Fund-Growth-Regular Plan)"
-            )
-            == "Bandhan ELSS Tax saver Fund-Growth-(Regular Plan)"
-        )
-        assert (
-            get_parsed_scheme_name(
-                "Bandhan Liquid Fund-Growth-(Regular Plan) "
-                "(erstwhile IDFC Cash Fund-Growth-Regular Plan) (Non-Demat) "
-            )
-            == "Bandhan Liquid Fund-Growth-(Regular Plan)"
-        )
-
-    def test_isin_search(self):
-        isin, amfi, scheme_type = isin_search(
-            "Axis Long Term Equity Fund - Direct Growth", "KFINTECH", "128TSDGG"
-        )
-        assert isin == "INF846K01EW2"
-        assert amfi == "120503"
-        assert scheme_type == "EQUITY"
-
-        isin, amfi, scheme_type = isin_search("", "KARVY", "")
-        assert isin is None
-        assert amfi is None
-        assert scheme_type is None
diff --git a/uv.lock b/uv.lock
index 9890e79..5ac7ad6 100644
--- a/uv.lock
+++ b/uv.lock
@@ -27,20 +27,12 @@ dependencies = [
     { name = "casparser-isin" },
     { name = "click" },
     { name = "colorama" },
-    { name = "pdfminer-six" },
     { name = "pydantic" },
+    { name = "pypdfium2" },
     { name = "python-dateutil" },
     { name = "rich" },
 ]
 
-[package.optional-dependencies]
-fast = [
-    { name = "pymupdf" },
-]
-mupdf = [
-    { name = "pymupdf" },
-]
-
 [package.dev-dependencies]
 dev = [
     { name = "coverage", extra = ["toml"] },
@@ -53,24 +45,21 @@ dev = [
 [package.metadata]
 requires-dist = [
     { name = "casparser-isin", specifier = ">=2026.5.1" },
-    { name = "click", specifier = ">=8.0,<9.0" },
+    { name = "click", specifier = ">=8.0,<10" },
     { name = "colorama", specifier = ">=0.4.6,<1" },
-    { name = "pdfminer-six", specifier = ">=20240706" },
     { name = "pydantic", specifier = ">=2.3.0,<3" },
-    { name = "pymupdf", marker = "extra == 'fast'", specifier = ">=1.25.0" },
-    { name = "pymupdf", marker = "extra == 'mupdf'", specifier = ">=1.25.0" },
+    { name = "pypdfium2", specifier = ">=5.0,<7" },
     { name = "python-dateutil", specifier = ">=2.8.2,<3" },
     { name = "rich", specifier = ">=13.5.2,<16" },
 ]
-provides-extras = ["fast", "mupdf"]
 
 [package.metadata.requires-dev]
 dev = [
-    { name = "coverage", extras = ["toml"], specifier = ">=7.3.0,<8" },
-    { name = "ipython", specifier = ">=8.31.0,<9" },
+    { name = "coverage", extras = ["toml"], specifier = ">=7.3.0,<9" },
+    { name = "ipython", specifier = ">=8.31.0" },
     { name = "pre-commit", specifier = ">=4.0.0,<5" },
     { name = "pytest", specifier = ">=8.0.0,<10" },
-    { name = "pytest-cov", specifier = "~=6.0.0" },
+    { name = "pytest-cov", specifier = ">=6.0,<8" },
 ]
 
 [[package]]
@@ -86,76 +75,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/23/89/b0dc213b033475bca7224b91040c68202dafda87d3ba5a3e5fe264e58f87/casparser_isin-2026.5.1-py3-none-any.whl", hash = "sha256:7b7386000dcfce5cfe31d6dd27f71b8e20c47ea56801a63b78636192cc3aee77", size = 9343316, upload-time = "2026-05-22T04:29:48.205Z" },
 ]
 
-[[package]]
-name = "cffi"
-version = "2.0.0"
-source = { registry = "https://pypi.org/simple" }
-dependencies = [
-    { name = "pycparser", marker = "implementation_name != 'PyPy'" },
-]
-sdist = { url = "https://files.pythonhosted.org/packages/eb/56/b1ba7935a17738ae8453301356628e8147c79dbb825bcbc73dc7401f9846/cffi-2.0.0.tar.gz", hash = "sha256:44d1b5909021139fe36001ae048dbdde8214afa20200eda0f64c068cac5d5529", size = 523588, upload-time = "2025-09-08T23:24:04.541Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/12/4a/3dfd5f7850cbf0d06dc84ba9aa00db766b52ca38d8b86e3a38314d52498c/cffi-2.0.0-cp311-cp311-macosx_10_13_x86_64.whl", hash = "sha256:b4c854ef3adc177950a8dfc81a86f5115d2abd545751a304c5bcf2c2c7283cfe", size = 184344, upload-time = "2025-09-08T23:22:26.456Z" },
-    { url = "https://files.pythonhosted.org/packages/4f/8b/f0e4c441227ba756aafbe78f117485b25bb26b1c059d01f137fa6d14896b/cffi-2.0.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:2de9a304e27f7596cd03d16f1b7c72219bd944e99cc52b84d0145aefb07cbd3c", size = 180560, upload-time = "2025-09-08T23:22:28.197Z" },
-    { url = "https://files.pythonhosted.org/packages/b1/b7/1200d354378ef52ec227395d95c2576330fd22a869f7a70e88e1447eb234/cffi-2.0.0-cp311-cp311-manylinux1_i686.manylinux2014_i686.manylinux_2_17_i686.manylinux_2_5_i686.whl", hash = "sha256:baf5215e0ab74c16e2dd324e8ec067ef59e41125d3eade2b863d294fd5035c92", size = 209613, upload-time = "2025-09-08T23:22:29.475Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/56/6033f5e86e8cc9bb629f0077ba71679508bdf54a9a5e112a3c0b91870332/cffi-2.0.0-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:730cacb21e1bdff3ce90babf007d0a0917cc3e6492f336c2f0134101e0944f93", size = 216476, upload-time = "2025-09-08T23:22:31.063Z" },
-    { url = "https://files.pythonhosted.org/packages/dc/7f/55fecd70f7ece178db2f26128ec41430d8720f2d12ca97bf8f0a628207d5/cffi-2.0.0-cp311-cp311-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:6824f87845e3396029f3820c206e459ccc91760e8fa24422f8b0c3d1731cbec5", size = 203374, upload-time = "2025-09-08T23:22:32.507Z" },
-    { url = "https://files.pythonhosted.org/packages/84/ef/a7b77c8bdc0f77adc3b46888f1ad54be8f3b7821697a7b89126e829e676a/cffi-2.0.0-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:9de40a7b0323d889cf8d23d1ef214f565ab154443c42737dfe52ff82cf857664", size = 202597, upload-time = "2025-09-08T23:22:34.132Z" },
-    { url = "https://files.pythonhosted.org/packages/d7/91/500d892b2bf36529a75b77958edfcd5ad8e2ce4064ce2ecfeab2125d72d1/cffi-2.0.0-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:8941aaadaf67246224cee8c3803777eed332a19d909b47e29c9842ef1e79ac26", size = 215574, upload-time = "2025-09-08T23:22:35.443Z" },
-    { url = "https://files.pythonhosted.org/packages/44/64/58f6255b62b101093d5df22dcb752596066c7e89dd725e0afaed242a61be/cffi-2.0.0-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:a05d0c237b3349096d3981b727493e22147f934b20f6f125a3eba8f994bec4a9", size = 218971, upload-time = "2025-09-08T23:22:36.805Z" },
-    { url = "https://files.pythonhosted.org/packages/ab/49/fa72cebe2fd8a55fbe14956f9970fe8eb1ac59e5df042f603ef7c8ba0adc/cffi-2.0.0-cp311-cp311-musllinux_1_2_i686.whl", hash = "sha256:94698a9c5f91f9d138526b48fe26a199609544591f859c870d477351dc7b2414", size = 211972, upload-time = "2025-09-08T23:22:38.436Z" },
-    { url = "https://files.pythonhosted.org/packages/0b/28/dd0967a76aab36731b6ebfe64dec4e981aff7e0608f60c2d46b46982607d/cffi-2.0.0-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:5fed36fccc0612a53f1d4d9a816b50a36702c28a2aa880cb8a122b3466638743", size = 217078, upload-time = "2025-09-08T23:22:39.776Z" },
-    { url = "https://files.pythonhosted.org/packages/2b/c0/015b25184413d7ab0a410775fdb4a50fca20f5589b5dab1dbbfa3baad8ce/cffi-2.0.0-cp311-cp311-win32.whl", hash = "sha256:c649e3a33450ec82378822b3dad03cc228b8f5963c0c12fc3b1e0ab940f768a5", size = 172076, upload-time = "2025-09-08T23:22:40.95Z" },
-    { url = "https://files.pythonhosted.org/packages/ae/8f/dc5531155e7070361eb1b7e4c1a9d896d0cb21c49f807a6c03fd63fc877e/cffi-2.0.0-cp311-cp311-win_amd64.whl", hash = "sha256:66f011380d0e49ed280c789fbd08ff0d40968ee7b665575489afa95c98196ab5", size = 182820, upload-time = "2025-09-08T23:22:42.463Z" },
-    { url = "https://files.pythonhosted.org/packages/95/5c/1b493356429f9aecfd56bc171285a4c4ac8697f76e9bbbbb105e537853a1/cffi-2.0.0-cp311-cp311-win_arm64.whl", hash = "sha256:c6638687455baf640e37344fe26d37c404db8b80d037c3d29f58fe8d1c3b194d", size = 177635, upload-time = "2025-09-08T23:22:43.623Z" },
-    { url = "https://files.pythonhosted.org/packages/ea/47/4f61023ea636104d4f16ab488e268b93008c3d0bb76893b1b31db1f96802/cffi-2.0.0-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:6d02d6655b0e54f54c4ef0b94eb6be0607b70853c45ce98bd278dc7de718be5d", size = 185271, upload-time = "2025-09-08T23:22:44.795Z" },
-    { url = "https://files.pythonhosted.org/packages/df/a2/781b623f57358e360d62cdd7a8c681f074a71d445418a776eef0aadb4ab4/cffi-2.0.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:8eca2a813c1cb7ad4fb74d368c2ffbbb4789d377ee5bb8df98373c2cc0dee76c", size = 181048, upload-time = "2025-09-08T23:22:45.938Z" },
-    { url = "https://files.pythonhosted.org/packages/ff/df/a4f0fbd47331ceeba3d37c2e51e9dfc9722498becbeec2bd8bc856c9538a/cffi-2.0.0-cp312-cp312-manylinux1_i686.manylinux2014_i686.manylinux_2_17_i686.manylinux_2_5_i686.whl", hash = "sha256:21d1152871b019407d8ac3985f6775c079416c282e431a4da6afe7aefd2bccbe", size = 212529, upload-time = "2025-09-08T23:22:47.349Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/72/12b5f8d3865bf0f87cf1404d8c374e7487dcf097a1c91c436e72e6badd83/cffi-2.0.0-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:b21e08af67b8a103c71a250401c78d5e0893beff75e28c53c98f4de42f774062", size = 220097, upload-time = "2025-09-08T23:22:48.677Z" },
-    { url = "https://files.pythonhosted.org/packages/c2/95/7a135d52a50dfa7c882ab0ac17e8dc11cec9d55d2c18dda414c051c5e69e/cffi-2.0.0-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:1e3a615586f05fc4065a8b22b8152f0c1b00cdbc60596d187c2a74f9e3036e4e", size = 207983, upload-time = "2025-09-08T23:22:50.06Z" },
-    { url = "https://files.pythonhosted.org/packages/3a/c8/15cb9ada8895957ea171c62dc78ff3e99159ee7adb13c0123c001a2546c1/cffi-2.0.0-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:81afed14892743bbe14dacb9e36d9e0e504cd204e0b165062c488942b9718037", size = 206519, upload-time = "2025-09-08T23:22:51.364Z" },
-    { url = "https://files.pythonhosted.org/packages/78/2d/7fa73dfa841b5ac06c7b8855cfc18622132e365f5b81d02230333ff26e9e/cffi-2.0.0-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:3e17ed538242334bf70832644a32a7aae3d83b57567f9fd60a26257e992b79ba", size = 219572, upload-time = "2025-09-08T23:22:52.902Z" },
-    { url = "https://files.pythonhosted.org/packages/07/e0/267e57e387b4ca276b90f0434ff88b2c2241ad72b16d31836adddfd6031b/cffi-2.0.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:3925dd22fa2b7699ed2617149842d2e6adde22b262fcbfada50e3d195e4b3a94", size = 222963, upload-time = "2025-09-08T23:22:54.518Z" },
-    { url = "https://files.pythonhosted.org/packages/b6/75/1f2747525e06f53efbd878f4d03bac5b859cbc11c633d0fb81432d98a795/cffi-2.0.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:2c8f814d84194c9ea681642fd164267891702542f028a15fc97d4674b6206187", size = 221361, upload-time = "2025-09-08T23:22:55.867Z" },
-    { url = "https://files.pythonhosted.org/packages/7b/2b/2b6435f76bfeb6bbf055596976da087377ede68df465419d192acf00c437/cffi-2.0.0-cp312-cp312-win32.whl", hash = "sha256:da902562c3e9c550df360bfa53c035b2f241fed6d9aef119048073680ace4a18", size = 172932, upload-time = "2025-09-08T23:22:57.188Z" },
-    { url = "https://files.pythonhosted.org/packages/f8/ed/13bd4418627013bec4ed6e54283b1959cf6db888048c7cf4b4c3b5b36002/cffi-2.0.0-cp312-cp312-win_amd64.whl", hash = "sha256:da68248800ad6320861f129cd9c1bf96ca849a2771a59e0344e88681905916f5", size = 183557, upload-time = "2025-09-08T23:22:58.351Z" },
-    { url = "https://files.pythonhosted.org/packages/95/31/9f7f93ad2f8eff1dbc1c3656d7ca5bfd8fb52c9d786b4dcf19b2d02217fa/cffi-2.0.0-cp312-cp312-win_arm64.whl", hash = "sha256:4671d9dd5ec934cb9a73e7ee9676f9362aba54f7f34910956b84d727b0d73fb6", size = 177762, upload-time = "2025-09-08T23:22:59.668Z" },
-    { url = "https://files.pythonhosted.org/packages/4b/8d/a0a47a0c9e413a658623d014e91e74a50cdd2c423f7ccfd44086ef767f90/cffi-2.0.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:00bdf7acc5f795150faa6957054fbbca2439db2f775ce831222b66f192f03beb", size = 185230, upload-time = "2025-09-08T23:23:00.879Z" },
-    { url = "https://files.pythonhosted.org/packages/4a/d2/a6c0296814556c68ee32009d9c2ad4f85f2707cdecfd7727951ec228005d/cffi-2.0.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:45d5e886156860dc35862657e1494b9bae8dfa63bf56796f2fb56e1679fc0bca", size = 181043, upload-time = "2025-09-08T23:23:02.231Z" },
-    { url = "https://files.pythonhosted.org/packages/b0/1e/d22cc63332bd59b06481ceaac49d6c507598642e2230f201649058a7e704/cffi-2.0.0-cp313-cp313-manylinux1_i686.manylinux2014_i686.manylinux_2_17_i686.manylinux_2_5_i686.whl", hash = "sha256:07b271772c100085dd28b74fa0cd81c8fb1a3ba18b21e03d7c27f3436a10606b", size = 212446, upload-time = "2025-09-08T23:23:03.472Z" },
-    { url = "https://files.pythonhosted.org/packages/a9/f5/a2c23eb03b61a0b8747f211eb716446c826ad66818ddc7810cc2cc19b3f2/cffi-2.0.0-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:d48a880098c96020b02d5a1f7d9251308510ce8858940e6fa99ece33f610838b", size = 220101, upload-time = "2025-09-08T23:23:04.792Z" },
-    { url = "https://files.pythonhosted.org/packages/f2/7f/e6647792fc5850d634695bc0e6ab4111ae88e89981d35ac269956605feba/cffi-2.0.0-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:f93fd8e5c8c0a4aa1f424d6173f14a892044054871c771f8566e4008eaa359d2", size = 207948, upload-time = "2025-09-08T23:23:06.127Z" },
-    { url = "https://files.pythonhosted.org/packages/cb/1e/a5a1bd6f1fb30f22573f76533de12a00bf274abcdc55c8edab639078abb6/cffi-2.0.0-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:dd4f05f54a52fb558f1ba9f528228066954fee3ebe629fc1660d874d040ae5a3", size = 206422, upload-time = "2025-09-08T23:23:07.753Z" },
-    { url = "https://files.pythonhosted.org/packages/98/df/0a1755e750013a2081e863e7cd37e0cdd02664372c754e5560099eb7aa44/cffi-2.0.0-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:c8d3b5532fc71b7a77c09192b4a5a200ea992702734a2e9279a37f2478236f26", size = 219499, upload-time = "2025-09-08T23:23:09.648Z" },
-    { url = "https://files.pythonhosted.org/packages/50/e1/a969e687fcf9ea58e6e2a928ad5e2dd88cc12f6f0ab477e9971f2309b57c/cffi-2.0.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:d9b29c1f0ae438d5ee9acb31cadee00a58c46cc9c0b2f9038c6b0b3470877a8c", size = 222928, upload-time = "2025-09-08T23:23:10.928Z" },
-    { url = "https://files.pythonhosted.org/packages/36/54/0362578dd2c9e557a28ac77698ed67323ed5b9775ca9d3fe73fe191bb5d8/cffi-2.0.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:6d50360be4546678fc1b79ffe7a66265e28667840010348dd69a314145807a1b", size = 221302, upload-time = "2025-09-08T23:23:12.42Z" },
-    { url = "https://files.pythonhosted.org/packages/eb/6d/bf9bda840d5f1dfdbf0feca87fbdb64a918a69bca42cfa0ba7b137c48cb8/cffi-2.0.0-cp313-cp313-win32.whl", hash = "sha256:74a03b9698e198d47562765773b4a8309919089150a0bb17d829ad7b44b60d27", size = 172909, upload-time = "2025-09-08T23:23:14.32Z" },
-    { url = "https://files.pythonhosted.org/packages/37/18/6519e1ee6f5a1e579e04b9ddb6f1676c17368a7aba48299c3759bbc3c8b3/cffi-2.0.0-cp313-cp313-win_amd64.whl", hash = "sha256:19f705ada2530c1167abacb171925dd886168931e0a7b78f5bffcae5c6b5be75", size = 183402, upload-time = "2025-09-08T23:23:15.535Z" },
-    { url = "https://files.pythonhosted.org/packages/cb/0e/02ceeec9a7d6ee63bb596121c2c8e9b3a9e150936f4fbef6ca1943e6137c/cffi-2.0.0-cp313-cp313-win_arm64.whl", hash = "sha256:256f80b80ca3853f90c21b23ee78cd008713787b1b1e93eae9f3d6a7134abd91", size = 177780, upload-time = "2025-09-08T23:23:16.761Z" },
-    { url = "https://files.pythonhosted.org/packages/92/c4/3ce07396253a83250ee98564f8d7e9789fab8e58858f35d07a9a2c78de9f/cffi-2.0.0-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:fc33c5141b55ed366cfaad382df24fe7dcbc686de5be719b207bb248e3053dc5", size = 185320, upload-time = "2025-09-08T23:23:18.087Z" },
-    { url = "https://files.pythonhosted.org/packages/59/dd/27e9fa567a23931c838c6b02d0764611c62290062a6d4e8ff7863daf9730/cffi-2.0.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:c654de545946e0db659b3400168c9ad31b5d29593291482c43e3564effbcee13", size = 181487, upload-time = "2025-09-08T23:23:19.622Z" },
-    { url = "https://files.pythonhosted.org/packages/d6/43/0e822876f87ea8a4ef95442c3d766a06a51fc5298823f884ef87aaad168c/cffi-2.0.0-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:24b6f81f1983e6df8db3adc38562c83f7d4a0c36162885ec7f7b77c7dcbec97b", size = 220049, upload-time = "2025-09-08T23:23:20.853Z" },
-    { url = "https://files.pythonhosted.org/packages/b4/89/76799151d9c2d2d1ead63c2429da9ea9d7aac304603de0c6e8764e6e8e70/cffi-2.0.0-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:12873ca6cb9b0f0d3a0da705d6086fe911591737a59f28b7936bdfed27c0d47c", size = 207793, upload-time = "2025-09-08T23:23:22.08Z" },
-    { url = "https://files.pythonhosted.org/packages/bb/dd/3465b14bb9e24ee24cb88c9e3730f6de63111fffe513492bf8c808a3547e/cffi-2.0.0-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:d9b97165e8aed9272a6bb17c01e3cc5871a594a446ebedc996e2397a1c1ea8ef", size = 206300, upload-time = "2025-09-08T23:23:23.314Z" },
-    { url = "https://files.pythonhosted.org/packages/47/d9/d83e293854571c877a92da46fdec39158f8d7e68da75bf73581225d28e90/cffi-2.0.0-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:afb8db5439b81cf9c9d0c80404b60c3cc9c3add93e114dcae767f1477cb53775", size = 219244, upload-time = "2025-09-08T23:23:24.541Z" },
-    { url = "https://files.pythonhosted.org/packages/2b/0f/1f177e3683aead2bb00f7679a16451d302c436b5cbf2505f0ea8146ef59e/cffi-2.0.0-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:737fe7d37e1a1bffe70bd5754ea763a62a066dc5913ca57e957824b72a85e205", size = 222828, upload-time = "2025-09-08T23:23:26.143Z" },
-    { url = "https://files.pythonhosted.org/packages/c6/0f/cafacebd4b040e3119dcb32fed8bdef8dfe94da653155f9d0b9dc660166e/cffi-2.0.0-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:38100abb9d1b1435bc4cc340bb4489635dc2f0da7456590877030c9b3d40b0c1", size = 220926, upload-time = "2025-09-08T23:23:27.873Z" },
-    { url = "https://files.pythonhosted.org/packages/3e/aa/df335faa45b395396fcbc03de2dfcab242cd61a9900e914fe682a59170b1/cffi-2.0.0-cp314-cp314-win32.whl", hash = "sha256:087067fa8953339c723661eda6b54bc98c5625757ea62e95eb4898ad5e776e9f", size = 175328, upload-time = "2025-09-08T23:23:44.61Z" },
-    { url = "https://files.pythonhosted.org/packages/bb/92/882c2d30831744296ce713f0feb4c1cd30f346ef747b530b5318715cc367/cffi-2.0.0-cp314-cp314-win_amd64.whl", hash = "sha256:203a48d1fb583fc7d78a4c6655692963b860a417c0528492a6bc21f1aaefab25", size = 185650, upload-time = "2025-09-08T23:23:45.848Z" },
-    { url = "https://files.pythonhosted.org/packages/9f/2c/98ece204b9d35a7366b5b2c6539c350313ca13932143e79dc133ba757104/cffi-2.0.0-cp314-cp314-win_arm64.whl", hash = "sha256:dbd5c7a25a7cb98f5ca55d258b103a2054f859a46ae11aaf23134f9cc0d356ad", size = 180687, upload-time = "2025-09-08T23:23:47.105Z" },
-    { url = "https://files.pythonhosted.org/packages/3e/61/c768e4d548bfa607abcda77423448df8c471f25dbe64fb2ef6d555eae006/cffi-2.0.0-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:9a67fc9e8eb39039280526379fb3a70023d77caec1852002b4da7e8b270c4dd9", size = 188773, upload-time = "2025-09-08T23:23:29.347Z" },
-    { url = "https://files.pythonhosted.org/packages/2c/ea/5f76bce7cf6fcd0ab1a1058b5af899bfbef198bea4d5686da88471ea0336/cffi-2.0.0-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:7a66c7204d8869299919db4d5069a82f1561581af12b11b3c9f48c584eb8743d", size = 185013, upload-time = "2025-09-08T23:23:30.63Z" },
-    { url = "https://files.pythonhosted.org/packages/be/b4/c56878d0d1755cf9caa54ba71e5d049479c52f9e4afc230f06822162ab2f/cffi-2.0.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:7cc09976e8b56f8cebd752f7113ad07752461f48a58cbba644139015ac24954c", size = 221593, upload-time = "2025-09-08T23:23:31.91Z" },
-    { url = "https://files.pythonhosted.org/packages/e0/0d/eb704606dfe8033e7128df5e90fee946bbcb64a04fcdaa97321309004000/cffi-2.0.0-cp314-cp314t-manylinux2014_ppc64le.manylinux_2_17_ppc64le.whl", hash = "sha256:92b68146a71df78564e4ef48af17551a5ddd142e5190cdf2c5624d0c3ff5b2e8", size = 209354, upload-time = "2025-09-08T23:23:33.214Z" },
-    { url = "https://files.pythonhosted.org/packages/d8/19/3c435d727b368ca475fb8742ab97c9cb13a0de600ce86f62eab7fa3eea60/cffi-2.0.0-cp314-cp314t-manylinux2014_s390x.manylinux_2_17_s390x.whl", hash = "sha256:b1e74d11748e7e98e2f426ab176d4ed720a64412b6a15054378afdb71e0f37dc", size = 208480, upload-time = "2025-09-08T23:23:34.495Z" },
-    { url = "https://files.pythonhosted.org/packages/d0/44/681604464ed9541673e486521497406fadcc15b5217c3e326b061696899a/cffi-2.0.0-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:28a3a209b96630bca57cce802da70c266eb08c6e97e5afd61a75611ee6c64592", size = 221584, upload-time = "2025-09-08T23:23:36.096Z" },
-    { url = "https://files.pythonhosted.org/packages/25/8e/342a504ff018a2825d395d44d63a767dd8ebc927ebda557fecdaca3ac33a/cffi-2.0.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:7553fb2090d71822f02c629afe6042c299edf91ba1bf94951165613553984512", size = 224443, upload-time = "2025-09-08T23:23:37.328Z" },
-    { url = "https://files.pythonhosted.org/packages/e1/5e/b666bacbbc60fbf415ba9988324a132c9a7a0448a9a8f125074671c0f2c3/cffi-2.0.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:6c6c373cfc5c83a975506110d17457138c8c63016b563cc9ed6e056a82f13ce4", size = 223437, upload-time = "2025-09-08T23:23:38.945Z" },
-    { url = "https://files.pythonhosted.org/packages/a0/1d/ec1a60bd1a10daa292d3cd6bb0b359a81607154fb8165f3ec95fe003b85c/cffi-2.0.0-cp314-cp314t-win32.whl", hash = "sha256:1fc9ea04857caf665289b7a75923f2c6ed559b8298a1b8c49e59f7dd95c8481e", size = 180487, upload-time = "2025-09-08T23:23:40.423Z" },
-    { url = "https://files.pythonhosted.org/packages/bf/41/4c1168c74fac325c0c8156f04b6749c8b6a8f405bbf91413ba088359f60d/cffi-2.0.0-cp314-cp314t-win_amd64.whl", hash = "sha256:d68b6cef7827e8641e8ef16f4494edda8b36104d79773a334beaa1e3521430f6", size = 191726, upload-time = "2025-09-08T23:23:41.742Z" },
-    { url = "https://files.pythonhosted.org/packages/ae/3a/dbeec9d1ee0844c679f6bb5d6ad4e9f198b1224f4e7a32825f47f6192b0c/cffi-2.0.0-cp314-cp314t-win_arm64.whl", hash = "sha256:0a1527a803f0a659de1af2e1fd700213caba79377e27e4693648c2923da066f9", size = 184195, upload-time = "2025-09-08T23:23:43.004Z" },
-]
-
 [[package]]
 name = "cfgv"
 version = "3.5.0"
@@ -165,95 +84,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/db/3c/33bac158f8ab7f89b2e59426d5fe2e4f63f7ed25df84c036890172b412b5/cfgv-3.5.0-py2.py3-none-any.whl", hash = "sha256:a8dc6b26ad22ff227d2634a65cb388215ce6cc96bbcc5cfde7641ae87e8dacc0", size = 7445, upload-time = "2025-11-19T20:55:50.744Z" },
 ]
 
-[[package]]
-name = "charset-normalizer"
-version = "3.4.7"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/e7/a1/67fe25fac3c7642725500a3f6cfe5821ad557c3abb11c9d20d12c7008d3e/charset_normalizer-3.4.7.tar.gz", hash = "sha256:ae89db9e5f98a11a4bf50407d4363e7b09b31e55bc117b4f7d80aab97ba009e5", size = 144271, upload-time = "2026-04-02T09:28:39.342Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/c2/d7/b5b7020a0565c2e9fa8c09f4b5fa6232feb326b8c20081ccded47ea368fd/charset_normalizer-3.4.7-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:7641bb8895e77f921102f72833904dcd9901df5d6d72a2ab8f31d04b7e51e4e7", size = 309705, upload-time = "2026-04-02T09:26:02.191Z" },
-    { url = "https://files.pythonhosted.org/packages/5a/53/58c29116c340e5456724ecd2fff4196d236b98f3da97b404bc5e51ac3493/charset_normalizer-3.4.7-cp311-cp311-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:202389074300232baeb53ae2569a60901f7efadd4245cf3a3bf0617d60b439d7", size = 206419, upload-time = "2026-04-02T09:26:03.583Z" },
-    { url = "https://files.pythonhosted.org/packages/b2/02/e8146dc6591a37a00e5144c63f29fb7c97a734ea8a111190783c0e60ab63/charset_normalizer-3.4.7-cp311-cp311-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:30b8d1d8c52a48c2c5690e152c169b673487a2a58de1ec7393196753063fcd5e", size = 227901, upload-time = "2026-04-02T09:26:04.738Z" },
-    { url = "https://files.pythonhosted.org/packages/fb/73/77486c4cd58f1267bf17db420e930c9afa1b3be3fe8c8b8ebbebc9624359/charset_normalizer-3.4.7-cp311-cp311-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:532bc9bf33a68613fd7d65e4b1c71a6a38d7d42604ecf239c77392e9b4e8998c", size = 222742, upload-time = "2026-04-02T09:26:06.36Z" },
-    { url = "https://files.pythonhosted.org/packages/a1/fa/f74eb381a7d94ded44739e9d94de18dc5edc9c17fb8c11f0a6890696c0a9/charset_normalizer-3.4.7-cp311-cp311-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:2fe249cb4651fd12605b7288b24751d8bfd46d35f12a20b1ba33dea122e690df", size = 214061, upload-time = "2026-04-02T09:26:08.347Z" },
-    { url = "https://files.pythonhosted.org/packages/dc/92/42bd3cefcf7687253fb86694b45f37b733c97f59af3724f356fa92b8c344/charset_normalizer-3.4.7-cp311-cp311-manylinux_2_31_armv7l.whl", hash = "sha256:65bcd23054beab4d166035cabbc868a09c1a49d1efe458fe8e4361215df40265", size = 199239, upload-time = "2026-04-02T09:26:09.823Z" },
-    { url = "https://files.pythonhosted.org/packages/4c/3d/069e7184e2aa3b3cddc700e3dd267413dc259854adc3380421c805c6a17d/charset_normalizer-3.4.7-cp311-cp311-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:08e721811161356f97b4059a9ba7bafb23ea5ee2255402c42881c214e173c6b4", size = 210173, upload-time = "2026-04-02T09:26:10.953Z" },
-    { url = "https://files.pythonhosted.org/packages/62/51/9d56feb5f2e7074c46f93e0ebdbe61f0848ee246e2f0d89f8e20b89ebb8f/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_aarch64.whl", hash = "sha256:e060d01aec0a910bdccb8be71faf34e7799ce36950f8294c8bf612cba65a2c9e", size = 209841, upload-time = "2026-04-02T09:26:12.142Z" },
-    { url = "https://files.pythonhosted.org/packages/d2/59/893d8f99cc4c837dda1fe2f1139079703deb9f321aabcb032355de13b6c7/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_armv7l.whl", hash = "sha256:38c0109396c4cfc574d502df99742a45c72c08eff0a36158b6f04000043dbf38", size = 200304, upload-time = "2026-04-02T09:26:13.711Z" },
-    { url = "https://files.pythonhosted.org/packages/7d/1d/ee6f3be3464247578d1ed5c46de545ccc3d3ff933695395c402c21fa6b77/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_ppc64le.whl", hash = "sha256:1c2a768fdd44ee4a9339a9b0b130049139b8ce3c01d2ce09f67f5a68048d477c", size = 229455, upload-time = "2026-04-02T09:26:14.941Z" },
-    { url = "https://files.pythonhosted.org/packages/54/bb/8fb0a946296ea96a488928bdce8ef99023998c48e4713af533e9bb98ef07/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_riscv64.whl", hash = "sha256:1a87ca9d5df6fe460483d9a5bbf2b18f620cbed41b432e2bddb686228282d10b", size = 210036, upload-time = "2026-04-02T09:26:16.478Z" },
-    { url = "https://files.pythonhosted.org/packages/9a/bc/015b2387f913749f82afd4fcba07846d05b6d784dd16123cb66860e0237d/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_s390x.whl", hash = "sha256:d635aab80466bc95771bb78d5370e74d36d1fe31467b6b29b8b57b2a3cd7d22c", size = 224739, upload-time = "2026-04-02T09:26:17.751Z" },
-    { url = "https://files.pythonhosted.org/packages/17/ab/63133691f56baae417493cba6b7c641571a2130eb7bceba6773367ab9ec5/charset_normalizer-3.4.7-cp311-cp311-musllinux_1_2_x86_64.whl", hash = "sha256:ae196f021b5e7c78e918242d217db021ed2a6ace2bc6ae94c0fc596221c7f58d", size = 216277, upload-time = "2026-04-02T09:26:18.981Z" },
-    { url = "https://files.pythonhosted.org/packages/06/6d/3be70e827977f20db77c12a97e6a9f973631a45b8d186c084527e53e77a4/charset_normalizer-3.4.7-cp311-cp311-win32.whl", hash = "sha256:adb2597b428735679446b46c8badf467b4ca5f5056aae4d51a19f9570301b1ad", size = 147819, upload-time = "2026-04-02T09:26:20.295Z" },
-    { url = "https://files.pythonhosted.org/packages/20/d9/5f67790f06b735d7c7637171bbfd89882ad67201891b7275e51116ed8207/charset_normalizer-3.4.7-cp311-cp311-win_amd64.whl", hash = "sha256:8e385e4267ab76874ae30db04c627faaaf0b509e1ccc11a95b3fc3e83f855c00", size = 159281, upload-time = "2026-04-02T09:26:21.74Z" },
-    { url = "https://files.pythonhosted.org/packages/ca/83/6413f36c5a34afead88ce6f66684d943d91f233d76dd083798f9602b75ae/charset_normalizer-3.4.7-cp311-cp311-win_arm64.whl", hash = "sha256:d4a48e5b3c2a489fae013b7589308a40146ee081f6f509e047e0e096084ceca1", size = 147843, upload-time = "2026-04-02T09:26:22.901Z" },
-    { url = "https://files.pythonhosted.org/packages/0c/eb/4fc8d0a7110eb5fc9cc161723a34a8a6c200ce3b4fbf681bc86feee22308/charset_normalizer-3.4.7-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:eca9705049ad3c7345d574e3510665cb2cf844c2f2dcfe675332677f081cbd46", size = 311328, upload-time = "2026-04-02T09:26:24.331Z" },
-    { url = "https://files.pythonhosted.org/packages/f8/e3/0fadc706008ac9d7b9b5be6dc767c05f9d3e5df51744ce4cc9605de7b9f4/charset_normalizer-3.4.7-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6178f72c5508bfc5fd446a5905e698c6212932f25bcdd4b47a757a50605a90e2", size = 208061, upload-time = "2026-04-02T09:26:25.568Z" },
-    { url = "https://files.pythonhosted.org/packages/42/f0/3dd1045c47f4a4604df85ec18ad093912ae1344ac706993aff91d38773a2/charset_normalizer-3.4.7-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:e1421b502d83040e6d7fb2fb18dff63957f720da3d77b2fbd3187ceb63755d7b", size = 229031, upload-time = "2026-04-02T09:26:26.865Z" },
-    { url = "https://files.pythonhosted.org/packages/dc/67/675a46eb016118a2fbde5a277a5d15f4f69d5f3f5f338e5ee2f8948fcf43/charset_normalizer-3.4.7-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:edac0f1ab77644605be2cbba52e6b7f630731fc42b34cb0f634be1a6eface56a", size = 225239, upload-time = "2026-04-02T09:26:28.044Z" },
-    { url = "https://files.pythonhosted.org/packages/4b/f8/d0118a2f5f23b02cd166fa385c60f9b0d4f9194f574e2b31cef350ad7223/charset_normalizer-3.4.7-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:5649fd1c7bade02f320a462fdefd0b4bd3ce036065836d4f42e0de958038e116", size = 216589, upload-time = "2026-04-02T09:26:29.239Z" },
-    { url = "https://files.pythonhosted.org/packages/b1/f1/6d2b0b261b6c4ceef0fcb0d17a01cc5bc53586c2d4796fa04b5c540bc13d/charset_normalizer-3.4.7-cp312-cp312-manylinux_2_31_armv7l.whl", hash = "sha256:203104ed3e428044fd943bc4bf45fa73c0730391f9621e37fe39ecf477b128cb", size = 202733, upload-time = "2026-04-02T09:26:30.5Z" },
-    { url = "https://files.pythonhosted.org/packages/6f/c0/7b1f943f7e87cc3db9626ba17807d042c38645f0a1d4415c7a14afb5591f/charset_normalizer-3.4.7-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:298930cec56029e05497a76988377cbd7457ba864beeea92ad7e844fe74cd1f1", size = 212652, upload-time = "2026-04-02T09:26:31.709Z" },
-    { url = "https://files.pythonhosted.org/packages/38/dd/5a9ab159fe45c6e72079398f277b7d2b523e7f716acc489726115a910097/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:708838739abf24b2ceb208d0e22403dd018faeef86ddac04319a62ae884c4f15", size = 211229, upload-time = "2026-04-02T09:26:33.282Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/ff/531a1cad5ca855d1c1a8b69cb71abfd6d85c0291580146fda7c82857caa1/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:0f7eb884681e3938906ed0434f20c63046eacd0111c4ba96f27b76084cd679f5", size = 203552, upload-time = "2026-04-02T09:26:34.845Z" },
-    { url = "https://files.pythonhosted.org/packages/c1/4c/a5fb52d528a8ca41f7598cb619409ece30a169fbdf9cdce592e53b46c3a6/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:4dc1e73c36828f982bfe79fadf5919923f8a6f4df2860804db9a98c48824ce8d", size = 230806, upload-time = "2026-04-02T09:26:36.152Z" },
-    { url = "https://files.pythonhosted.org/packages/59/7a/071feed8124111a32b316b33ae4de83d36923039ef8cf48120266844285b/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:aed52fea0513bac0ccde438c188c8a471c4e0f457c2dd20cdbf6ea7a450046c7", size = 212316, upload-time = "2026-04-02T09:26:37.672Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/35/f7dba3994312d7ba508e041eaac39a36b120f32d4c8662b8814dab876431/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:fea24543955a6a729c45a73fe90e08c743f0b3334bbf3201e6c4bc1b0c7fa464", size = 227274, upload-time = "2026-04-02T09:26:38.93Z" },
-    { url = "https://files.pythonhosted.org/packages/8a/2d/a572df5c9204ab7688ec1edc895a73ebded3b023bb07364710b05dd1c9be/charset_normalizer-3.4.7-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:bb6d88045545b26da47aa879dd4a89a71d1dce0f0e549b1abcb31dfe4a8eac49", size = 218468, upload-time = "2026-04-02T09:26:40.17Z" },
-    { url = "https://files.pythonhosted.org/packages/86/eb/890922a8b03a568ca2f336c36585a4713c55d4d67bf0f0c78924be6315ca/charset_normalizer-3.4.7-cp312-cp312-win32.whl", hash = "sha256:2257141f39fe65a3fdf38aeccae4b953e5f3b3324f4ff0daf9f15b8518666a2c", size = 148460, upload-time = "2026-04-02T09:26:41.416Z" },
-    { url = "https://files.pythonhosted.org/packages/35/d9/0e7dffa06c5ab081f75b1b786f0aefc88365825dfcd0ac544bdb7b2b6853/charset_normalizer-3.4.7-cp312-cp312-win_amd64.whl", hash = "sha256:5ed6ab538499c8644b8a3e18debabcd7ce684f3fa91cf867521a7a0279cab2d6", size = 159330, upload-time = "2026-04-02T09:26:42.554Z" },
-    { url = "https://files.pythonhosted.org/packages/9e/5d/481bcc2a7c88ea6b0878c299547843b2521ccbc40980cb406267088bc701/charset_normalizer-3.4.7-cp312-cp312-win_arm64.whl", hash = "sha256:56be790f86bfb2c98fb742ce566dfb4816e5a83384616ab59c49e0604d49c51d", size = 147828, upload-time = "2026-04-02T09:26:44.075Z" },
-    { url = "https://files.pythonhosted.org/packages/c1/3b/66777e39d3ae1ddc77ee606be4ec6d8cbd4c801f65e5a1b6f2b11b8346dd/charset_normalizer-3.4.7-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:f496c9c3cc02230093d8330875c4c3cdfc3b73612a5fd921c65d39cbcef08063", size = 309627, upload-time = "2026-04-02T09:26:45.198Z" },
-    { url = "https://files.pythonhosted.org/packages/2e/4e/b7f84e617b4854ade48a1b7915c8ccfadeba444d2a18c291f696e37f0d3b/charset_normalizer-3.4.7-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:0ea948db76d31190bf08bd371623927ee1339d5f2a0b4b1b4a4439a65298703c", size = 207008, upload-time = "2026-04-02T09:26:46.824Z" },
-    { url = "https://files.pythonhosted.org/packages/c4/bb/ec73c0257c9e11b268f018f068f5d00aa0ef8c8b09f7753ebd5f2880e248/charset_normalizer-3.4.7-cp313-cp313-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:a277ab8928b9f299723bc1a2dabb1265911b1a76341f90a510368ca44ad9ab66", size = 228303, upload-time = "2026-04-02T09:26:48.397Z" },
-    { url = "https://files.pythonhosted.org/packages/85/fb/32d1f5033484494619f701e719429c69b766bfc4dbc61aa9e9c8c166528b/charset_normalizer-3.4.7-cp313-cp313-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:3bec022aec2c514d9cf199522a802bd007cd588ab17ab2525f20f9c34d067c18", size = 224282, upload-time = "2026-04-02T09:26:49.684Z" },
-    { url = "https://files.pythonhosted.org/packages/fa/07/330e3a0dda4c404d6da83b327270906e9654a24f6c546dc886a0eb0ffb23/charset_normalizer-3.4.7-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:e044c39e41b92c845bc815e5ae4230804e8e7bc29e399b0437d64222d92809dd", size = 215595, upload-time = "2026-04-02T09:26:50.915Z" },
-    { url = "https://files.pythonhosted.org/packages/e3/7c/fc890655786e423f02556e0216d4b8c6bcb6bdfa890160dc66bf52dee468/charset_normalizer-3.4.7-cp313-cp313-manylinux_2_31_armv7l.whl", hash = "sha256:f495a1652cf3fbab2eb0639776dad966c2fb874d79d87ca07f9d5f059b8bd215", size = 201986, upload-time = "2026-04-02T09:26:52.197Z" },
-    { url = "https://files.pythonhosted.org/packages/d8/97/bfb18b3db2aed3b90cf54dc292ad79fdd5ad65c4eae454099475cbeadd0d/charset_normalizer-3.4.7-cp313-cp313-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:e712b419df8ba5e42b226c510472b37bd57b38e897d3eca5e8cfd410a29fa859", size = 211711, upload-time = "2026-04-02T09:26:53.49Z" },
-    { url = "https://files.pythonhosted.org/packages/6f/a5/a581c13798546a7fd557c82614a5c65a13df2157e9ad6373166d2a3e645d/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:7804338df6fcc08105c7745f1502ba68d900f45fd770d5bdd5288ddccb8a42d8", size = 210036, upload-time = "2026-04-02T09:26:54.975Z" },
-    { url = "https://files.pythonhosted.org/packages/8c/bf/b3ab5bcb478e4193d517644b0fb2bf5497fbceeaa7a1bc0f4d5b50953861/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_armv7l.whl", hash = "sha256:481551899c856c704d58119b5025793fa6730adda3571971af568f66d2424bb5", size = 202998, upload-time = "2026-04-02T09:26:56.303Z" },
-    { url = "https://files.pythonhosted.org/packages/e7/4e/23efd79b65d314fa320ec6017b4b5834d5c12a58ba4610aa353af2e2f577/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_ppc64le.whl", hash = "sha256:f59099f9b66f0d7145115e6f80dd8b1d847176df89b234a5a6b3f00437aa0832", size = 230056, upload-time = "2026-04-02T09:26:57.554Z" },
-    { url = "https://files.pythonhosted.org/packages/b9/9f/1e1941bc3f0e01df116e68dc37a55c4d249df5e6fa77f008841aef68264f/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_riscv64.whl", hash = "sha256:f59ad4c0e8f6bba240a9bb85504faa1ab438237199d4cce5f622761507b8f6a6", size = 211537, upload-time = "2026-04-02T09:26:58.843Z" },
-    { url = "https://files.pythonhosted.org/packages/80/0f/088cbb3020d44428964a6c97fe1edfb1b9550396bf6d278330281e8b709c/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_s390x.whl", hash = "sha256:3dedcc22d73ec993f42055eff4fcfed9318d1eeb9a6606c55892a26964964e48", size = 226176, upload-time = "2026-04-02T09:27:00.437Z" },
-    { url = "https://files.pythonhosted.org/packages/6a/9f/130394f9bbe06f4f63e22641d32fc9b202b7e251c9aef4db044324dac493/charset_normalizer-3.4.7-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:64f02c6841d7d83f832cd97ccf8eb8a906d06eb95d5276069175c696b024b60a", size = 217723, upload-time = "2026-04-02T09:27:02.021Z" },
-    { url = "https://files.pythonhosted.org/packages/73/55/c469897448a06e49f8fa03f6caae97074fde823f432a98f979cc42b90e69/charset_normalizer-3.4.7-cp313-cp313-win32.whl", hash = "sha256:4042d5c8f957e15221d423ba781e85d553722fc4113f523f2feb7b188cc34c5e", size = 148085, upload-time = "2026-04-02T09:27:03.192Z" },
-    { url = "https://files.pythonhosted.org/packages/5d/78/1b74c5bbb3f99b77a1715c91b3e0b5bdb6fe302d95ace4f5b1bec37b0167/charset_normalizer-3.4.7-cp313-cp313-win_amd64.whl", hash = "sha256:3946fa46a0cf3e4c8cb1cc52f56bb536310d34f25f01ca9b6c16afa767dab110", size = 158819, upload-time = "2026-04-02T09:27:04.454Z" },
-    { url = "https://files.pythonhosted.org/packages/68/86/46bd42279d323deb8687c4a5a811fd548cb7d1de10cf6535d099877a9a9f/charset_normalizer-3.4.7-cp313-cp313-win_arm64.whl", hash = "sha256:80d04837f55fc81da168b98de4f4b797ef007fc8a79ab71c6ec9bc4dd662b15b", size = 147915, upload-time = "2026-04-02T09:27:05.971Z" },
-    { url = "https://files.pythonhosted.org/packages/97/c8/c67cb8c70e19ef1960b97b22ed2a1567711de46c4ddf19799923adc836c2/charset_normalizer-3.4.7-cp314-cp314-macosx_10_15_universal2.whl", hash = "sha256:c36c333c39be2dbca264d7803333c896ab8fa7d4d6f0ab7edb7dfd7aea6e98c0", size = 309234, upload-time = "2026-04-02T09:27:07.194Z" },
-    { url = "https://files.pythonhosted.org/packages/99/85/c091fdee33f20de70d6c8b522743b6f831a2f1cd3ff86de4c6a827c48a76/charset_normalizer-3.4.7-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:1c2aed2e5e41f24ea8ef1590b8e848a79b56f3a5564a65ceec43c9d692dc7d8a", size = 208042, upload-time = "2026-04-02T09:27:08.749Z" },
-    { url = "https://files.pythonhosted.org/packages/87/1c/ab2ce611b984d2fd5d86a5a8a19c1ae26acac6bad967da4967562c75114d/charset_normalizer-3.4.7-cp314-cp314-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:54523e136b8948060c0fa0bc7b1b50c32c186f2fceee897a495406bb6e311d2b", size = 228706, upload-time = "2026-04-02T09:27:09.951Z" },
-    { url = "https://files.pythonhosted.org/packages/a8/29/2b1d2cb00bf085f59d29eb773ce58ec2d325430f8c216804a0a5cd83cbca/charset_normalizer-3.4.7-cp314-cp314-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:715479b9a2802ecac752a3b0efa2b0b60285cf962ee38414211abdfccc233b41", size = 224727, upload-time = "2026-04-02T09:27:11.175Z" },
-    { url = "https://files.pythonhosted.org/packages/47/5c/032c2d5a07fe4d4855fea851209cca2b6f03ebeb6d4e3afdb3358386a684/charset_normalizer-3.4.7-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:bd6c2a1c7573c64738d716488d2cdd3c00e340e4835707d8fdb8dc1a66ef164e", size = 215882, upload-time = "2026-04-02T09:27:12.446Z" },
-    { url = "https://files.pythonhosted.org/packages/2c/c2/356065d5a8b78ed04499cae5f339f091946a6a74f91e03476c33f0ab7100/charset_normalizer-3.4.7-cp314-cp314-manylinux_2_31_armv7l.whl", hash = "sha256:c45e9440fb78f8ddabcf714b68f936737a121355bf59f3907f4e17721b9d1aae", size = 200860, upload-time = "2026-04-02T09:27:13.721Z" },
-    { url = "https://files.pythonhosted.org/packages/0c/cd/a32a84217ced5039f53b29f460962abb2d4420def55afabe45b1c3c7483d/charset_normalizer-3.4.7-cp314-cp314-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:3534e7dcbdcf757da6b85a0bbf5b6868786d5982dd959b065e65481644817a18", size = 211564, upload-time = "2026-04-02T09:27:15.272Z" },
-    { url = "https://files.pythonhosted.org/packages/44/86/58e6f13ce26cc3b8f4a36b94a0f22ae2f00a72534520f4ae6857c4b81f89/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:e8ac484bf18ce6975760921bb6148041faa8fef0547200386ea0b52b5d27bf7b", size = 211276, upload-time = "2026-04-02T09:27:16.834Z" },
-    { url = "https://files.pythonhosted.org/packages/8f/fe/d17c32dc72e17e155e06883efa84514ca375f8a528ba2546bee73fc4df81/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_armv7l.whl", hash = "sha256:a5fe03b42827c13cdccd08e6c0247b6a6d4b5e3cdc53fd1749f5896adcdc2356", size = 201238, upload-time = "2026-04-02T09:27:18.229Z" },
-    { url = "https://files.pythonhosted.org/packages/6a/29/f33daa50b06525a237451cdb6c69da366c381a3dadcd833fa5676bc468b3/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_ppc64le.whl", hash = "sha256:2d6eb928e13016cea4f1f21d1e10c1cebd5a421bc57ddf5b1142ae3f86824fab", size = 230189, upload-time = "2026-04-02T09:27:19.445Z" },
-    { url = "https://files.pythonhosted.org/packages/b6/6e/52c84015394a6a0bdcd435210a7e944c5f94ea1055f5cc5d56c5fe368e7b/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_riscv64.whl", hash = "sha256:e74327fb75de8986940def6e8dee4f127cc9752bee7355bb323cc5b2659b6d46", size = 211352, upload-time = "2026-04-02T09:27:20.79Z" },
-    { url = "https://files.pythonhosted.org/packages/8c/d7/4353be581b373033fb9198bf1da3cf8f09c1082561e8e922aa7b39bf9fe8/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_s390x.whl", hash = "sha256:d6038d37043bced98a66e68d3aa2b6a35505dc01328cd65217cefe82f25def44", size = 227024, upload-time = "2026-04-02T09:27:22.063Z" },
-    { url = "https://files.pythonhosted.org/packages/30/45/99d18aa925bd1740098ccd3060e238e21115fffbfdcb8f3ece837d0ace6c/charset_normalizer-3.4.7-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:7579e913a5339fb8fa133f6bbcfd8e6749696206cf05acdbdca71a1b436d8e72", size = 217869, upload-time = "2026-04-02T09:27:23.486Z" },
-    { url = "https://files.pythonhosted.org/packages/5c/05/5ee478aa53f4bb7996482153d4bfe1b89e0f087f0ab6b294fcf92d595873/charset_normalizer-3.4.7-cp314-cp314-win32.whl", hash = "sha256:5b77459df20e08151cd6f8b9ef8ef1f961ef73d85c21a555c7eed5b79410ec10", size = 148541, upload-time = "2026-04-02T09:27:25.146Z" },
-    { url = "https://files.pythonhosted.org/packages/48/77/72dcb0921b2ce86420b2d79d454c7022bf5be40202a2a07906b9f2a35c97/charset_normalizer-3.4.7-cp314-cp314-win_amd64.whl", hash = "sha256:92a0a01ead5e668468e952e4238cccd7c537364eb7d851ab144ab6627dbbe12f", size = 159634, upload-time = "2026-04-02T09:27:26.642Z" },
-    { url = "https://files.pythonhosted.org/packages/c6/a3/c2369911cd72f02386e4e340770f6e158c7980267da16af8f668217abaa0/charset_normalizer-3.4.7-cp314-cp314-win_arm64.whl", hash = "sha256:67f6279d125ca0046a7fd386d01b311c6363844deac3e5b069b514ba3e63c246", size = 148384, upload-time = "2026-04-02T09:27:28.271Z" },
-    { url = "https://files.pythonhosted.org/packages/94/09/7e8a7f73d24dba1f0035fbbf014d2c36828fc1bf9c88f84093e57d315935/charset_normalizer-3.4.7-cp314-cp314t-macosx_10_15_universal2.whl", hash = "sha256:effc3f449787117233702311a1b7d8f59cba9ced946ba727bdc329ec69028e24", size = 330133, upload-time = "2026-04-02T09:27:29.474Z" },
-    { url = "https://files.pythonhosted.org/packages/8d/da/96975ddb11f8e977f706f45cddd8540fd8242f71ecdb5d18a80723dcf62c/charset_normalizer-3.4.7-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:fbccdc05410c9ee21bbf16a35f4c1d16123dcdeb8a1d38f33654fa21d0234f79", size = 216257, upload-time = "2026-04-02T09:27:30.793Z" },
-    { url = "https://files.pythonhosted.org/packages/e5/e8/1d63bf8ef2d388e95c64b2098f45f84758f6d102a087552da1485912637b/charset_normalizer-3.4.7-cp314-cp314t-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:733784b6d6def852c814bce5f318d25da2ee65dd4839a0718641c696e09a2960", size = 234851, upload-time = "2026-04-02T09:27:32.44Z" },
-    { url = "https://files.pythonhosted.org/packages/9b/40/e5ff04233e70da2681fa43969ad6f66ca5611d7e669be0246c4c7aaf6dc8/charset_normalizer-3.4.7-cp314-cp314t-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:a89c23ef8d2c6b27fd200a42aa4ac72786e7c60d40efdc76e6011260b6e949c4", size = 233393, upload-time = "2026-04-02T09:27:34.03Z" },
-    { url = "https://files.pythonhosted.org/packages/be/c1/06c6c49d5a5450f76899992f1ee40b41d076aee9279b49cf9974d2f313d5/charset_normalizer-3.4.7-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:6c114670c45346afedc0d947faf3c7f701051d2518b943679c8ff88befe14f8e", size = 223251, upload-time = "2026-04-02T09:27:35.369Z" },
-    { url = "https://files.pythonhosted.org/packages/2b/9f/f2ff16fb050946169e3e1f82134d107e5d4ae72647ec8a1b1446c148480f/charset_normalizer-3.4.7-cp314-cp314t-manylinux_2_31_armv7l.whl", hash = "sha256:a180c5e59792af262bf263b21a3c49353f25945d8d9f70628e73de370d55e1e1", size = 206609, upload-time = "2026-04-02T09:27:36.661Z" },
-    { url = "https://files.pythonhosted.org/packages/69/d5/a527c0cd8d64d2eab7459784fb4169a0ac76e5a6fc5237337982fd61347e/charset_normalizer-3.4.7-cp314-cp314t-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:3c9a494bc5ec77d43cea229c4f6db1e4d8fe7e1bbffa8b6f0f0032430ff8ab44", size = 220014, upload-time = "2026-04-02T09:27:38.019Z" },
-    { url = "https://files.pythonhosted.org/packages/7e/80/8a7b8104a3e203074dc9aa2c613d4b726c0e136bad1cc734594b02867972/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:8d828b6667a32a728a1ad1d93957cdf37489c57b97ae6c4de2860fa749b8fc1e", size = 218979, upload-time = "2026-04-02T09:27:39.37Z" },
-    { url = "https://files.pythonhosted.org/packages/02/9a/b759b503d507f375b2b5c153e4d2ee0a75aa215b7f2489cf314f4541f2c0/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_armv7l.whl", hash = "sha256:cf1493cd8607bec4d8a7b9b004e699fcf8f9103a9284cc94962cb73d20f9d4a3", size = 209238, upload-time = "2026-04-02T09:27:40.722Z" },
-    { url = "https://files.pythonhosted.org/packages/c2/4e/0f3f5d47b86bdb79256e7290b26ac847a2832d9a4033f7eb2cd4bcf4bb5b/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_ppc64le.whl", hash = "sha256:0c96c3b819b5c3e9e165495db84d41914d6894d55181d2d108cc1a69bfc9cce0", size = 236110, upload-time = "2026-04-02T09:27:42.33Z" },
-    { url = "https://files.pythonhosted.org/packages/96/23/bce28734eb3ed2c91dcf93abeb8a5cf393a7b2749725030bb630e554fdd8/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_riscv64.whl", hash = "sha256:752a45dc4a6934060b3b0dab47e04edc3326575f82be64bc4fc293914566503e", size = 219824, upload-time = "2026-04-02T09:27:43.924Z" },
-    { url = "https://files.pythonhosted.org/packages/2c/6f/6e897c6984cc4d41af319b077f2f600fc8214eb2fe2d6bcb79141b882400/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_s390x.whl", hash = "sha256:8778f0c7a52e56f75d12dae53ae320fae900a8b9b4164b981b9c5ce059cd1fcb", size = 233103, upload-time = "2026-04-02T09:27:45.348Z" },
-    { url = "https://files.pythonhosted.org/packages/76/22/ef7bd0fe480a0ae9b656189ec00744b60933f68b4f42a7bb06589f6f576a/charset_normalizer-3.4.7-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:ce3412fbe1e31eb81ea42f4169ed94861c56e643189e1e75f0041f3fe7020abe", size = 225194, upload-time = "2026-04-02T09:27:46.706Z" },
-    { url = "https://files.pythonhosted.org/packages/c5/a7/0e0ab3e0b5bc1219bd80a6a0d4d72ca74d9250cb2382b7c699c147e06017/charset_normalizer-3.4.7-cp314-cp314t-win32.whl", hash = "sha256:c03a41a8784091e67a39648f70c5f97b5b6a37f216896d44d2cdcb82615339a0", size = 159827, upload-time = "2026-04-02T09:27:48.053Z" },
-    { url = "https://files.pythonhosted.org/packages/7a/1d/29d32e0fb40864b1f878c7f5a0b343ae676c6e2b271a2d55cc3a152391da/charset_normalizer-3.4.7-cp314-cp314t-win_amd64.whl", hash = "sha256:03853ed82eeebbce3c2abfdbc98c96dc205f32a79627688ac9a27370ea61a49c", size = 174168, upload-time = "2026-04-02T09:27:49.795Z" },
-    { url = "https://files.pythonhosted.org/packages/de/32/d92444ad05c7a6e41fb2036749777c163baf7a0301a040cb672d6b2b1ae9/charset_normalizer-3.4.7-cp314-cp314t-win_arm64.whl", hash = "sha256:c35abb8bfff0185efac5878da64c45dafd2b37fb0383add1be155a763c1f083d", size = 153018, upload-time = "2026-04-02T09:27:51.116Z" },
-    { url = "https://files.pythonhosted.org/packages/db/8f/61959034484a4a7c527811f4721e75d02d653a35afb0b6054474d8185d4c/charset_normalizer-3.4.7-py3-none-any.whl", hash = "sha256:3dce51d0f5e7951f8bb4900c257dad282f49190fdbebecd4ba99bcc41fef404d", size = 61958, upload-time = "2026-04-02T09:28:37.794Z" },
-]
-
 [[package]]
 name = "click"
 version = "8.4.0"
@@ -379,65 +209,6 @@ toml = [
     { name = "tomli", marker = "python_full_version <= '3.11'" },
 ]
 
-[[package]]
-name = "cryptography"
-version = "48.0.0"
-source = { registry = "https://pypi.org/simple" }
-dependencies = [
-    { name = "cffi", marker = "platform_python_implementation != 'PyPy'" },
-]
-sdist = { url = "https://files.pythonhosted.org/packages/9f/a9/db8f313fdcd85d767d4973515e1db101f9c71f95fced83233de224673757/cryptography-48.0.0.tar.gz", hash = "sha256:5c3932f4436d1cccb036cb0eaef46e6e2db91035166f1ad6505c3c9d5a635920", size = 832984, upload-time = "2026-05-04T22:59:38.133Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/df/3d/01f6dd9190170a5a241e0e98c2d04be3664a9e6f5b9b872cde63aff1c3dd/cryptography-48.0.0-cp311-abi3-macosx_10_9_universal2.whl", hash = "sha256:0c558d2cdffd8f4bbb30fc7134c74d2ca9a476f830bb053074498fbc86f41ed6", size = 8001587, upload-time = "2026-05-04T22:57:36.803Z" },
-    { url = "https://files.pythonhosted.org/packages/b2/6e/e90527eef33f309beb811cf7c982c3aeffcce8e3edb178baa4ca3ae4a6fa/cryptography-48.0.0-cp311-abi3-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:f5333311663ea94f75dd408665686aaf426563556bb5283554a3539177e03b8c", size = 4690433, upload-time = "2026-05-04T22:57:40.373Z" },
-    { url = "https://files.pythonhosted.org/packages/90/04/673510ed51ddff56575f306cf1617d80411ee76831ccd3097599140efdfe/cryptography-48.0.0-cp311-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7995ef305d7165c3f11ae07f2517e5a4f1d5c18da1376a0a9ed496336b69e5f3", size = 4710620, upload-time = "2026-05-04T22:57:42.935Z" },
-    { url = "https://files.pythonhosted.org/packages/14/d5/e9c4ef932c8d800490c34d8bd589d64a31d5890e27ec9e9ad532be893294/cryptography-48.0.0-cp311-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:40ba1f85eaa6959837b1d51c9767e230e14612eea4ef110ee8854ada22da1bf5", size = 4696283, upload-time = "2026-05-04T22:57:45.294Z" },
-    { url = "https://files.pythonhosted.org/packages/0c/29/174b9dfb60b12d59ecfc6cfa04bc88c21b42a54f01b8aae09bb6e51e4c7f/cryptography-48.0.0-cp311-abi3-manylinux_2_28_ppc64le.whl", hash = "sha256:369a6348999f94bbd53435c894377b20ab95f25a9065c283570e70150d8abc3c", size = 5296573, upload-time = "2026-05-04T22:57:47.933Z" },
-    { url = "https://files.pythonhosted.org/packages/95/38/0d29a6fd7d0d1373f0c0c88a04ba20e359b257753ac497564cd660fc1d55/cryptography-48.0.0-cp311-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:a0e692c683f4df67815a2d258b324e66f4738bd7a96a218c826dce4f4bd05d8f", size = 4743677, upload-time = "2026-05-04T22:57:50.067Z" },
-    { url = "https://files.pythonhosted.org/packages/30/be/eef653013d5c63b6a490529e0316f9ac14a37602965d4903efed1399f32b/cryptography-48.0.0-cp311-abi3-manylinux_2_31_armv7l.whl", hash = "sha256:18349bbc56f4743c8b12dc32e2bccb2cf83ee8b69a3bba74ef8ae857e26b3d25", size = 4330808, upload-time = "2026-05-04T22:57:52.301Z" },
-    { url = "https://files.pythonhosted.org/packages/84/9e/500463e87abb7a0a0f9f256ec21123ecde0a7b5541a15e840ea54551fd81/cryptography-48.0.0-cp311-abi3-manylinux_2_34_aarch64.whl", hash = "sha256:7e8eac43dfca5c4cccc6dad9a80504436fca53bb9bc3100a2386d730fbe6b602", size = 4695941, upload-time = "2026-05-04T22:57:54.603Z" },
-    { url = "https://files.pythonhosted.org/packages/e3/dc/7303087450c2ec9e7fbb750e17c2abfbc658f23cbd0e54009509b7cc4091/cryptography-48.0.0-cp311-abi3-manylinux_2_34_ppc64le.whl", hash = "sha256:9ccdac7d40688ecb5a3b4a604b8a88c8002e3442d6c60aead1db2a89a041560c", size = 5252579, upload-time = "2026-05-04T22:57:57.207Z" },
-    { url = "https://files.pythonhosted.org/packages/d0/c0/7101d3b7215edcdc90c45da544961fd8ed2d6448f77577460fa75a8443f7/cryptography-48.0.0-cp311-abi3-manylinux_2_34_x86_64.whl", hash = "sha256:bd72e68b06bb1e96913f97dd4901119bc17f39d4586a5adf2d3e47bc2b9d58b5", size = 4743326, upload-time = "2026-05-04T22:57:59.535Z" },
-    { url = "https://files.pythonhosted.org/packages/ac/d8/5b833bad13016f562ab9d063d68199a4bd121d18458e439515601d3357ec/cryptography-48.0.0-cp311-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:59baa2cb386c4f0b9905bd6eb4c2a79a69a128408fd31d32ca4d7102d4156321", size = 4826672, upload-time = "2026-05-04T22:58:01.996Z" },
-    { url = "https://files.pythonhosted.org/packages/98/e1/7074eb8bf3c135558c73fc2bcf0f5633f912e6fb87e868a55c454080ef09/cryptography-48.0.0-cp311-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:9249e3cd978541d665967ac2cb2787fd6a62bddf1e75b3e347a594d7dacf4f74", size = 4972574, upload-time = "2026-05-04T22:58:03.968Z" },
-    { url = "https://files.pythonhosted.org/packages/04/70/e5a1b41d325f797f39427aa44ef8baf0be500065ab6d8e10369d850d4a4f/cryptography-48.0.0-cp311-abi3-win32.whl", hash = "sha256:9c459db21422be75e2809370b829a87eb37f74cd785fc4aa9ea1e5f43b47cda4", size = 3294868, upload-time = "2026-05-04T22:58:06.467Z" },
-    { url = "https://files.pythonhosted.org/packages/f4/ac/8ac51b4a5fc5932eb7ee5c517ba7dc8cd834f0048962b6b352f00f41ebf9/cryptography-48.0.0-cp311-abi3-win_amd64.whl", hash = "sha256:5b012212e08b8dd5edc78ef54da83dd9892fd9105323b3993eff6bea65dc21d7", size = 3817107, upload-time = "2026-05-04T22:58:08.845Z" },
-    { url = "https://files.pythonhosted.org/packages/6b/84/70e3feea9feea87fd7cbe77efb2712ae1e3e6edf10749dc6e95f4e60e455/cryptography-48.0.0-cp314-cp314t-macosx_10_9_universal2.whl", hash = "sha256:3cb07a3ed6431663cd321ea8a000a1314c74211f823e4177fefa2255e057d1ec", size = 7986556, upload-time = "2026-05-04T22:58:11.172Z" },
-    { url = "https://files.pythonhosted.org/packages/89/6e/18e07a618bb5442ba10cf4df16e99c071365528aa570dfcb8c02e25a303b/cryptography-48.0.0-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:8c7378637d7d88016fa6791c159f698b3d3eed28ebf844ac36b9dc04a14dae18", size = 4684776, upload-time = "2026-05-04T22:58:13.712Z" },
-    { url = "https://files.pythonhosted.org/packages/be/6a/4ea3b4c6c6759794d5ee2103c304a5076dc4b19ae1f9fe47dba439e159e9/cryptography-48.0.0-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:cc90c0b39b2e3c65ef52c804b72e3c58f8a04ab2a1871272798e5f9572c17d20", size = 4698121, upload-time = "2026-05-04T22:58:16.448Z" },
-    { url = "https://files.pythonhosted.org/packages/2f/59/6ff6ad6cae03bb887da2a5860b2c9805f8dac969ef01ce563336c49bd1d1/cryptography-48.0.0-cp314-cp314t-manylinux_2_28_aarch64.whl", hash = "sha256:76341972e1eff8b4bea859f09c0d3e64b96ce931b084f9b9b7db8ef364c30eff", size = 4690042, upload-time = "2026-05-04T22:58:18.544Z" },
-    { url = "https://files.pythonhosted.org/packages/ca/b4/fc334ed8cfd705aca282fe4d8f5ae64a8e0f74932e9feecb344610cf6e4d/cryptography-48.0.0-cp314-cp314t-manylinux_2_28_ppc64le.whl", hash = "sha256:55b7718303bf06a5753dcdccf2f3945cf18ad7bffde41b61226e4db31ab89a9c", size = 5282526, upload-time = "2026-05-04T22:58:20.75Z" },
-    { url = "https://files.pythonhosted.org/packages/11/08/9f8c5386cc4cd90d8255c7cdd0f5baf459a08502a09de30dc51f553d38dc/cryptography-48.0.0-cp314-cp314t-manylinux_2_28_x86_64.whl", hash = "sha256:a64697c641c7b1b2178e573cbc31c7c6684cd56883a478d75143dbb7118036db", size = 4733116, upload-time = "2026-05-04T22:58:23.627Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/77/99307d7574045699f8805aa500fa0fb83422d115b5400a064ddd306d7750/cryptography-48.0.0-cp314-cp314t-manylinux_2_31_armv7l.whl", hash = "sha256:561215ea3879cb1cbbf272867e2efda62476f240fb58c64de6b393ae19246741", size = 4316030, upload-time = "2026-05-04T22:58:25.581Z" },
-    { url = "https://files.pythonhosted.org/packages/fd/36/a608b98337af3cb2aff4818e406649d30572b7031918b04c87d979495348/cryptography-48.0.0-cp314-cp314t-manylinux_2_34_aarch64.whl", hash = "sha256:ad64688338ed4bc1a6618076ba75fd7194a5f1797ac60b47afe926285adb3166", size = 4689640, upload-time = "2026-05-04T22:58:27.747Z" },
-    { url = "https://files.pythonhosted.org/packages/dd/a6/825010a291b4438aecc1f568bc428189fc1175515223632477c07dc0a6df/cryptography-48.0.0-cp314-cp314t-manylinux_2_34_ppc64le.whl", hash = "sha256:906cbf0670286c6e0044156bc7d4af9cbb0ef6db9f73e52c3ec56ba6bdde5336", size = 5237657, upload-time = "2026-05-04T22:58:29.848Z" },
-    { url = "https://files.pythonhosted.org/packages/b9/09/4e76a09b4caa29aad535ddc806f5d4c5d01885bd978bd984fbc6ca032cae/cryptography-48.0.0-cp314-cp314t-manylinux_2_34_x86_64.whl", hash = "sha256:ea8990436d914540a40ab24b6a77c0969695ed52f4a4874c5137ccf7045a7057", size = 4732362, upload-time = "2026-05-04T22:58:32.009Z" },
-    { url = "https://files.pythonhosted.org/packages/18/78/444fa04a77d0cb95f417dda20d450e13c56ba8e5220fc892a1658f44f882/cryptography-48.0.0-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:c18684a7f0cc9a3cb60328f496b8e3372def7c5d2df39ac267878b05565aaaae", size = 4819580, upload-time = "2026-05-04T22:58:34.254Z" },
-    { url = "https://files.pythonhosted.org/packages/38/85/ea67067c70a1fd4be2c63d35eeed82658023021affccc7b17705f8527dd2/cryptography-48.0.0-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:9be5aafa5736574f8f15f262adc81b2a9869e2cfe9014d52a44633905b40d52c", size = 4963283, upload-time = "2026-05-04T22:58:36.376Z" },
-    { url = "https://files.pythonhosted.org/packages/75/54/cc6d0f3deac3e81c7f847e8a189a12b6cdd65059b43dad25d4316abd849a/cryptography-48.0.0-cp314-cp314t-win32.whl", hash = "sha256:c17dfe85494deaeddc5ce251aebd1d60bbe6afc8b62071bb0b469431a000124f", size = 3270954, upload-time = "2026-05-04T22:58:38.791Z" },
-    { url = "https://files.pythonhosted.org/packages/49/67/cc947e288c0758a4e5473d1dcb743037ab7785541265a969240b8885441a/cryptography-48.0.0-cp314-cp314t-win_amd64.whl", hash = "sha256:27241b1dc9962e056062a8eef1991d02c3a24569c95975bd2322a8a52c6e5e12", size = 3797313, upload-time = "2026-05-04T22:58:40.746Z" },
-    { url = "https://files.pythonhosted.org/packages/f2/63/61d4a4e1c6b6bab6ce1e213cd36a24c415d90e76d78c5eb8577c5541d2e8/cryptography-48.0.0-cp39-abi3-macosx_10_9_universal2.whl", hash = "sha256:58d00498e8933e4a194f3076aee1b4a97dfec1a6da444535755822fe5d8b0b86", size = 7983482, upload-time = "2026-05-04T22:58:43.769Z" },
-    { url = "https://files.pythonhosted.org/packages/d5/ac/f5b5995b87770c693e2596559ffafe195b4033a57f14a82268a2842953f3/cryptography-48.0.0-cp39-abi3-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:614d0949f4790582d2cc25553abd09dd723025f0c0e7c67376a1d77196743d6e", size = 4683266, upload-time = "2026-05-04T22:58:46.064Z" },
-    { url = "https://files.pythonhosted.org/packages/ec/c6/8b14f67e18338fbc4adb76f66c001f5c3610b3e2d1837f268f47a347dbbb/cryptography-48.0.0-cp39-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7ce4bfae76319a532a2dc68f82cc32f5676ee792a983187dac07183690e5c66f", size = 4696228, upload-time = "2026-05-04T22:58:48.22Z" },
-    { url = "https://files.pythonhosted.org/packages/ea/73/f808fbae9514bd91b47875b003f13e284c8c6bdfd904b7944e803937eec1/cryptography-48.0.0-cp39-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:2eb992bbd4661238c5a397594c83f5b4dc2bc5b848c365c8f991b6780efcc5c7", size = 4689097, upload-time = "2026-05-04T22:58:50.9Z" },
-    { url = "https://files.pythonhosted.org/packages/93/01/d86632d7d28db8ae83221995752eeb6639ffb374c2d22955648cf8d52797/cryptography-48.0.0-cp39-abi3-manylinux_2_28_ppc64le.whl", hash = "sha256:22a5cb272895dce158b2cacdfdc3debd299019659f42947dbdac6f32d68fe832", size = 5283582, upload-time = "2026-05-04T22:58:53.017Z" },
-    { url = "https://files.pythonhosted.org/packages/02/e1/50edc7a50334807cc4791fc4a0ce7468b4a1416d9138eab358bfc9a3d70b/cryptography-48.0.0-cp39-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:2b4d59804e8408e2fea7d1fbaf218e5ec984325221db76e6a241a9abd6cdd95c", size = 4730479, upload-time = "2026-05-04T22:58:55.611Z" },
-    { url = "https://files.pythonhosted.org/packages/6f/af/99a582b1b1641ff5911ac559beb45097cf79efd4ead4657f578ef1af2d47/cryptography-48.0.0-cp39-abi3-manylinux_2_31_armv7l.whl", hash = "sha256:984a20b0f62a26f48a3396c72e4bc34c66e356d356bf370053066b3b6d54634a", size = 4326481, upload-time = "2026-05-04T22:58:57.607Z" },
-    { url = "https://files.pythonhosted.org/packages/90/ee/89aa26a06ef0a7d7611788ffd571a7c50e368cc6a4d5eef8b4884e866edb/cryptography-48.0.0-cp39-abi3-manylinux_2_34_aarch64.whl", hash = "sha256:5a5ed8fde7a1d09376ca0b40e68cd59c69fe23b1f9768bd5824f54681626032a", size = 4688713, upload-time = "2026-05-04T22:59:00.077Z" },
-    { url = "https://files.pythonhosted.org/packages/70/ba/bcb1b0bb7a33d4c7c0c4d4c7874b4a62ae4f56113a5f4baefa362dfb1f0f/cryptography-48.0.0-cp39-abi3-manylinux_2_34_ppc64le.whl", hash = "sha256:8cd666227ef7af430aa5914a9910e0ddd703e75f039cef0825cd0da71b6b711a", size = 5238165, upload-time = "2026-05-04T22:59:02.317Z" },
-    { url = "https://files.pythonhosted.org/packages/c9/70/ca4003b1ce5ca3dc3186ada51908c8a9b9ff7d5cab83cc0d43ee14ec144f/cryptography-48.0.0-cp39-abi3-manylinux_2_34_x86_64.whl", hash = "sha256:9071196d81abc88b3516ac8cdfad32e2b66dd4a5393a8e68a961e9161ddc6239", size = 4729947, upload-time = "2026-05-04T22:59:05.255Z" },
-    { url = "https://files.pythonhosted.org/packages/44/a0/4ec7cf774207905aef1a8d11c3750d5a1db805eb380ee4e16df317870128/cryptography-48.0.0-cp39-abi3-musllinux_1_2_aarch64.whl", hash = "sha256:1e2d54c8be6152856a36f0882ab231e70f8ec7f14e93cf87db8a2ed056bf160c", size = 4822059, upload-time = "2026-05-04T22:59:07.802Z" },
-    { url = "https://files.pythonhosted.org/packages/1e/75/a2e55f99c16fcac7b5d6c1eb19ad8e00799854d6be5ca845f9259eae1681/cryptography-48.0.0-cp39-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:a5da777e32ffed6f85a7b2b3f7c5cbc88c146bfcd0a1d7baf5fcc6c52ee35dd4", size = 4960575, upload-time = "2026-05-04T22:59:09.851Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/23/6e6f32143ab5d8b36ca848a502c4bcd477ae75b9e1677e3530d669062578/cryptography-48.0.0-cp39-abi3-win32.whl", hash = "sha256:77a2ccbbe917f6710e05ba9adaa25fb5075620bf3ea6fb751997875aff4ae4bd", size = 3279117, upload-time = "2026-05-04T22:59:12.019Z" },
-    { url = "https://files.pythonhosted.org/packages/9d/9a/0fea98a70cf1749d41d738836f6349d97945f7c89433a259a6c2642eefeb/cryptography-48.0.0-cp39-abi3-win_amd64.whl", hash = "sha256:16cd65b9330583e4619939b3a3843eec1e6e789744bb01e7c7e2e62e33c239c8", size = 3792100, upload-time = "2026-05-04T22:59:14.884Z" },
-    { url = "https://files.pythonhosted.org/packages/be/d2/024b5e06be9d44cb021fb0e1a03d34d63989cf56a0fe62f3dfbab695b9b4/cryptography-48.0.0-pp311-pypy311_pp73-macosx_11_0_arm64.whl", hash = "sha256:84cf79f0dc8b36ac5da873481716e87aef31fcfa0444f9e1d8b4b2cece142855", size = 3950391, upload-time = "2026-05-04T22:59:17.415Z" },
-    { url = "https://files.pythonhosted.org/packages/bc/17/3861e17c56fa0fd37491a14a8673fdb77c57fc5693cafe745ea8b06dba75/cryptography-48.0.0-pp311-pypy311_pp73-manylinux_2_28_aarch64.whl", hash = "sha256:fdfef35d751d510fcef5252703621574364fec16418c4a1e5e1055248401054b", size = 4637126, upload-time = "2026-05-04T22:59:20.197Z" },
-    { url = "https://files.pythonhosted.org/packages/f0/0a/7e226dbff530f21480727eb764973a7bff2b912f8e15cd4f129e71b56d1d/cryptography-48.0.0-pp311-pypy311_pp73-manylinux_2_28_x86_64.whl", hash = "sha256:0890f502ddf7d9c6426129c3f49f5c0a39278ed7cd6322c8755ffca6ee675a13", size = 4667270, upload-time = "2026-05-04T22:59:22.647Z" },
-    { url = "https://files.pythonhosted.org/packages/3b/f2/5a72274ca9f1b2a8b44a662ee0bf1b435909deb473d6f97bcd035bcdbc71/cryptography-48.0.0-pp311-pypy311_pp73-manylinux_2_34_aarch64.whl", hash = "sha256:ecde28a596bead48b0cfd2a1b4416c3d43074c2d785e3a398d7ec1fc4d0f7fbb", size = 4636797, upload-time = "2026-05-04T22:59:24.912Z" },
-    { url = "https://files.pythonhosted.org/packages/b4/e1/48cedb2fe63626e91ded1edad159e2a4fb8b6906c4425eb7749673077ce7/cryptography-48.0.0-pp311-pypy311_pp73-manylinux_2_34_x86_64.whl", hash = "sha256:4defde8685ae324a9eb9d818717e93b4638ef67070ac9bc15b8ca85f63048355", size = 4666800, upload-time = "2026-05-04T22:59:27.474Z" },
-    { url = "https://files.pythonhosted.org/packages/a2/ca/7e8365deec19afb2b2c7be7c1c0aa8f99633b54e90c570999acda93260fc/cryptography-48.0.0-pp311-pypy311_pp73-win_amd64.whl", hash = "sha256:db63bf618e5dea46c07de12e900fe1cdd2541e6dc9dbae772a70b7d4d4765f6a", size = 3739536, upload-time = "2026-05-04T22:59:29.61Z" },
-]
-
 [[package]]
 name = "decorator"
 version = "5.3.1"
@@ -585,19 +356,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/99/5d/8268b644392ee874ee82a635cd0df1773de230bde356c38de28e298392cc/parso-0.8.7-py2.py3-none-any.whl", hash = "sha256:a8926eb2a1b915486941fdbd31e86a4baf88fe8c210f25f2f35ecec5b574ca1c", size = 107025, upload-time = "2026-05-01T23:12:58.867Z" },
 ]
 
-[[package]]
-name = "pdfminer-six"
-version = "20260107"
-source = { registry = "https://pypi.org/simple" }
-dependencies = [
-    { name = "charset-normalizer" },
-    { name = "cryptography" },
-]
-sdist = { url = "https://files.pythonhosted.org/packages/34/a4/5cec1112009f0439a5ca6afa8ace321f0ab2f48da3255b7a1c8953014670/pdfminer_six-20260107.tar.gz", hash = "sha256:96bfd431e3577a55a0efd25676968ca4ce8fd5b53f14565f85716ff363889602", size = 8512094, upload-time = "2026-01-07T13:29:12.937Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/20/8b/28c4eaec9d6b036a52cb44720408f26b1a143ca9bce76cc19e8f5de00ab4/pdfminer_six-20260107-py3-none-any.whl", hash = "sha256:366585ba97e80dffa8f00cebe303d2f381884d8637af4ce422f1df3ef38111a9", size = 6592252, upload-time = "2026-01-07T13:29:10.742Z" },
-]
-
 [[package]]
 name = "pexpect"
 version = "4.9.0"
@@ -674,15 +432,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/8e/37/efad0257dc6e593a18957422533ff0f87ede7c9c6ea010a2177d738fb82f/pure_eval-0.2.3-py3-none-any.whl", hash = "sha256:1db8e35b67b3d218d818ae653e27f06c3aa420901fa7b081ca98cbedc874e0d0", size = 11842, upload-time = "2024-07-21T12:58:20.04Z" },
 ]
 
-[[package]]
-name = "pycparser"
-version = "3.0"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/1b/7d/92392ff7815c21062bea51aa7b87d45576f649f16458d78b7cf94b9ab2e6/pycparser-3.0.tar.gz", hash = "sha256:600f49d217304a5902ac3c37e1281c9fe94e4d0489de643a9504c5cdfdfc6b29", size = 103492, upload-time = "2026-01-21T14:26:51.89Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/0c/c3/44f3fbbfa403ea2a7c779186dc20772604442dde72947e7d01069cbe98e3/pycparser-3.0-py3-none-any.whl", hash = "sha256:b727414169a36b7d524c1c3e31839a521725078d7b2ff038656844266160a992", size = 48172, upload-time = "2026-01-21T14:26:50.693Z" },
-]
-
 [[package]]
 name = "pydantic"
 version = "2.13.4"
@@ -810,19 +559,32 @@ wheels = [
 ]
 
 [[package]]
-name = "pymupdf"
-version = "1.27.2.3"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/22/32/708bedc9dde7b328d45abbc076091769d44f2f24ad151ad92d56a6ec142b/pymupdf-1.27.2.3.tar.gz", hash = "sha256:7a92faa25129e8bbec5e50eeb9214f187665428c31b05c4ef6e36c58c0b1c6d2", size = 85759618, upload-time = "2026-04-24T14:13:14.42Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/dc/09/ddbdfa7ee91fbabd6f63d7d744884cbdfe3e7ff9b8604749fb38bddf5c5d/pymupdf-1.27.2.3-cp310-abi3-macosx_10_9_x86_64.whl", hash = "sha256:fc1bc3cae6e9e150b0dbb0a9221bdfd411d65f0db2fe359eaa22467d7cc2a05f", size = 24002636, upload-time = "2026-04-24T14:09:17.459Z" },
-    { url = "https://files.pythonhosted.org/packages/01/89/3f8edd6c4f50ca370e2a2f2a3011face36f3760728ffe76dffec91c0fca0/pymupdf-1.27.2.3-cp310-abi3-macosx_11_0_arm64.whl", hash = "sha256:660d93cb6da5bbddf11d3982ae27745dd3a9902d9f24cdb69adab83962294b5a", size = 23278238, upload-time = "2026-04-24T14:09:32.882Z" },
-    { url = "https://files.pythonhosted.org/packages/c3/26/b7e5a70eb83bd189f8b5df87ec442746b992f2f632662839b288170d357d/pymupdf-1.27.2.3-cp310-abi3-manylinux_2_28_aarch64.whl", hash = "sha256:1dd460a3ae4597a755f00a3bd9771f5ebf1531dc111f6a36bf05dd00a6b84425", size = 24333923, upload-time = "2026-04-24T14:09:47.341Z" },
-    { url = "https://files.pythonhosted.org/packages/e4/a0/aa1ee2240f29481a04a827c313333b4ecd8a14d6ac3e15d3f41a30574781/pymupdf-1.27.2.3-cp310-abi3-manylinux_2_28_x86_64.whl", hash = "sha256:857842b4888827bd6155a1131341b2822a7ebe9a8c15a975fd7d490d7a64a30c", size = 24963198, upload-time = "2026-04-24T14:10:07.408Z" },
-    { url = "https://files.pythonhosted.org/packages/69/49/4f742451f980840829fc00ba158bebb25d389c846d8f4f8c65936ee55de8/pymupdf-1.27.2.3-cp310-abi3-musllinux_1_2_x86_64.whl", hash = "sha256:580983849c64a08d08344ca3d1580e87c01f046a8392421797bc850efd72a5b6", size = 25184609, upload-time = "2026-04-24T14:10:22.911Z" },
-    { url = "https://files.pythonhosted.org/packages/f6/3f/3853d6608f394faf6eec2bd4e8ea9f6a00beea329b071abdb29f4164cc3d/pymupdf-1.27.2.3-cp310-abi3-win32.whl", hash = "sha256:a5c1088a87189891a4946ab314a14b7934ac4c5b6077f7e74ebee956f8906d0e", size = 18019286, upload-time = "2026-04-24T14:10:34.239Z" },
-    { url = "https://files.pythonhosted.org/packages/44/47/5fb10fe73f96b31253a41647c362ea9e0380920bddf16028414a051247fc/pymupdf-1.27.2.3-cp310-abi3-win_amd64.whl", hash = "sha256:d20f68ef15195e073071dbc4ae7455257c7889af7584e39df490c0a92728526e", size = 19249102, upload-time = "2026-04-24T14:10:46.72Z" },
-    { url = "https://files.pythonhosted.org/packages/53/a4/b9e91aac82293f9c954654c85581ee8212b5b05efadc534b581141241e6f/pymupdf-1.27.2.3-cp314-cp314t-manylinux_2_28_x86_64.whl", hash = "sha256:77691604c5d1d0233827139bbcdea61fd57879c84712b8e49b1f45520f7ab9c2", size = 25000393, upload-time = "2026-04-24T14:11:01.669Z" },
+name = "pypdfium2"
+version = "5.8.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/6d/3d/dc934d3b606c51c3ecc95b6731d84b7dd7ab8e513a50b0e98a4da6c8a719/pypdfium2-5.8.0.tar.gz", hash = "sha256:049397c647e50f83115ee951c49394dab9e9ba52ebdd5a11ab1109390eb3d34e", size = 271934, upload-time = "2026-05-04T17:39:43.794Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/6f/8c/6b75b923cb81368fa3ea7c48a0616b839620a3aeff899885bd930449b89e/pypdfium2-5.8.0-py3-none-android_23_arm64_v8a.whl", hash = "sha256:f67b6c74b716d9ac725ad1af49ae786ad813ac20823d45606d59f1fc06caa8af", size = 3374554, upload-time = "2026-05-04T17:39:05.552Z" },
+    { url = "https://files.pythonhosted.org/packages/ef/61/a885c7f36efba89ec98e3d1fe95c83b48c2d6dea321e9194ac6460e7a834/pypdfium2-5.8.0-py3-none-android_23_armeabi_v7a.whl", hash = "sha256:53e82bf3e6a2da170b1bda83f93b7eec57cb6efe3cacd05cba78823879a85203", size = 2831667, upload-time = "2026-05-04T17:39:08.028Z" },
+    { url = "https://files.pythonhosted.org/packages/86/1f/04b5627f6dba312d3e707e5b019c9f24d8b03b5aa366866a9e02ec00f8d4/pypdfium2-5.8.0-py3-none-macosx_11_0_arm64.whl", hash = "sha256:085e633dcc89b65ff4035a4787e98ce7ae636836eb39c83dd0db26113d9774bc", size = 3450815, upload-time = "2026-05-04T17:39:09.551Z" },
+    { url = "https://files.pythonhosted.org/packages/a9/77/8e3a2aba2bc4aef5abe1b1306d05b00588dc0bf7f5c850d1adf6164c786b/pypdfium2-5.8.0-py3-none-macosx_11_0_x86_64.whl", hash = "sha256:bc84b7c6efede88fcfb9467f81daf416f26b973a54fc1cf4d3410d622fda6d7a", size = 3634395, upload-time = "2026-05-04T17:39:11.225Z" },
+    { url = "https://files.pythonhosted.org/packages/93/11/6f2b1847d9fa457b3b7251afc2bba2706d104a0c6f01431dfae5d679a839/pypdfium2-5.8.0-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a63bf09b2e13ba8545c930d243f0650c664a1b51314daa3b5f38df6d1a17b4bc", size = 3617413, upload-time = "2026-05-04T17:39:13.139Z" },
+    { url = "https://files.pythonhosted.org/packages/ed/fd/99ce639de5ca06d21743c740dd988cd209dda623bc763ae10b8a162022e1/pypdfium2-5.8.0-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:937881c1698456749ed203a58db1895baa5eb7178cdb837ef84867790638da28", size = 3347639, upload-time = "2026-05-04T17:39:15.086Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/47/82864cc6e26dd8969d5594c168635acb16458d35cf5fed65d6b2e32abb42/pypdfium2-5.8.0-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:6be9dc2b84a8694ad7e626bab133244e8241014d5ed1930d865a9bdf90df1e24", size = 3746404, upload-time = "2026-05-04T17:39:17.094Z" },
+    { url = "https://files.pythonhosted.org/packages/82/58/e41e49bba951f61921bac7289e67fe02af5ac57192d0bbfb5f459dc3691d/pypdfium2-5.8.0-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:7f27bd82891ae302dd02d736b14809661f6d1220ee1e96dbed9b23e2811922a3", size = 4177893, upload-time = "2026-05-04T17:39:18.729Z" },
+    { url = "https://files.pythonhosted.org/packages/b4/15/fa7031010d5cf6853dadb4864680a0bfb7782c5bb6a1a401e0c25c4fca87/pypdfium2-5.8.0-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:26c1089cdbbdc7fe1248f6d17fe3f30214be4f287dd0196b31aaee18a1564240", size = 3665152, upload-time = "2026-05-04T17:39:20.207Z" },
+    { url = "https://files.pythonhosted.org/packages/de/6a/5a3520a8b0cfa8d7fdc3f03a07ad9d6146c28ffd519330706f64fd8939a8/pypdfium2-5.8.0-py3-none-manylinux_2_27_s390x.manylinux_2_28_s390x.whl", hash = "sha256:1c038a9290864aaa4862dd32e591993d82551ca4d152b4e8ce6d43ba37dc04a8", size = 3095365, upload-time = "2026-05-04T17:39:22.054Z" },
+    { url = "https://files.pythonhosted.org/packages/32/d3/845bae4de3cfa36865959046156edb5bf9baea400ccdecdd84fdd911b0f5/pypdfium2-5.8.0-py3-none-manylinux_2_38_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:f104bc1a6d8bfc1ff088aa50db13b9729cfdb3722b44975c3c457e9a7b9c7318", size = 2961801, upload-time = "2026-05-04T17:39:23.817Z" },
+    { url = "https://files.pythonhosted.org/packages/99/76/cf54eabee4a172241dfcfe63533bd1e11e2162114a983453a5a40bfec114/pypdfium2-5.8.0-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:04ca7c57a553facf8d46c6ea8ba6fa557e698670cfa4a58e0e01fdae2f6be87d", size = 4133067, upload-time = "2026-05-04T17:39:25.619Z" },
+    { url = "https://files.pythonhosted.org/packages/77/66/dcf871d19187ca04ea184a99801a6e7e556d8347aa49540fee33cda6dfc5/pypdfium2-5.8.0-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:ad42b9c22477b32dbedcbc8232833f385d92fd0cf92822547b02383cf9a476d7", size = 3749100, upload-time = "2026-05-04T17:39:27.203Z" },
+    { url = "https://files.pythonhosted.org/packages/32/67/0d456c79660959ca45ad307b4d67161d29f9ed4083ee1e8fe8c6925b7c82/pypdfium2-5.8.0-py3-none-musllinux_1_2_i686.whl", hash = "sha256:388e3119cf5ca0979b7d5f6d40b7fcd5ab49e17ed4e6de6af89ba116061acfda", size = 4339212, upload-time = "2026-05-04T17:39:29.277Z" },
+    { url = "https://files.pythonhosted.org/packages/76/89/e5b0e0f7936be341c91c0f45cd70d693878894ed62aed93a6ee32e9c43c4/pypdfium2-5.8.0-py3-none-musllinux_1_2_ppc64le.whl", hash = "sha256:aa05bbfa485ce7916217aa78d856c9f9cd86b08b20846c650392a67975ee72e9", size = 4383943, upload-time = "2026-05-04T17:39:31.287Z" },
+    { url = "https://files.pythonhosted.org/packages/82/21/4502ed255f082f579cd3537c2971cf1a57778d43703a08bcd1a92253189f/pypdfium2-5.8.0-py3-none-musllinux_1_2_riscv64.whl", hash = "sha256:f0813a16bb39d5ebd173ea5484430bb67a89b4b181db0a636c73b64ad063c3ea", size = 3925680, upload-time = "2026-05-04T17:39:33.241Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/4f/2e59723e7a07779439bd885c1b4960079c9710603308888d29ac926ae69a/pypdfium2-5.8.0-py3-none-musllinux_1_2_s390x.whl", hash = "sha256:a3c78f7d20dd821bec6c072efdb21a1370b9efe10fdeeb68c969e67608e25385", size = 4269560, upload-time = "2026-05-04T17:39:34.926Z" },
+    { url = "https://files.pythonhosted.org/packages/34/4e/7b6b1bde3788c8b880d4b8131d95d9d339cebafb3ad9102d82e234bb65be/pypdfium2-5.8.0-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:86d302e207c138c827b885a72784f7b306d840646ebeae07e8efdbc39321c629", size = 4182434, upload-time = "2026-05-04T17:39:36.624Z" },
+    { url = "https://files.pythonhosted.org/packages/11/7b/6ed4782e0d7a5278330598ce8c4b2df7255f4585a0b3d04520fa580d6507/pypdfium2-5.8.0-py3-none-win32.whl", hash = "sha256:3f25fd436920a907291462b41bdc0ab9f8235c3944b4c9c15398da595ffd1fed", size = 3636680, upload-time = "2026-05-04T17:39:38.49Z" },
+    { url = "https://files.pythonhosted.org/packages/19/55/da7223d4202b2461f4f889b0baf10dddec3db7f88e6fd8c52db4a516eecd/pypdfium2-5.8.0-py3-none-win_amd64.whl", hash = "sha256:55592af0bddd2d62bed18e0053c546c9b72041430c5115e54870f7f6163125b0", size = 3754962, upload-time = "2026-05-04T17:39:40.13Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/7a/f3dcefe6ee7389aad3ca1488c177e8fbf978206de21c7a99ccf487ea38ab/pypdfium2-5.8.0-py3-none-win_arm64.whl", hash = "sha256:3f17ed97ae8a5a1705301ca93af256a5b02f9009dee4e99c5e175831d46ebd7c", size = 3548362, upload-time = "2026-05-04T17:39:42.304Z" },
 ]
 
 [[package]]