From e0d227cf9179bb2b26ee9299a86109d6f48f1cd5 Mon Sep 17 00:00:00 2001 From: alex-rawlings-yyc Date: Thu, 19 Feb 2026 14:39:02 -0700 Subject: [PATCH 1/8] Add Interlinearization model, PT9 refactor, and viewing-mode support - Introduce `Interlinearization` data model. - Move internal-only PT9 types to dedicated file and change case of props. - Removed `ScrTextName` prop as it's been deprecated in PT9 since 2020. - Enhance interlinearizer WebView to support switching between viewing modes: InterlinearData and Interlinearization. - Update Jest configuration to include path aliases for types and parsers. - Modify README to clarify the structure of the `src/types/` and `src/parsers/` directories. - Rename `interlinearXmlParser` and related tests to `paratext9parser`. - Add new words to cspell configuration for improved spell checking. --- README.md | 3 +- cspell.json | 13 +- jest.config.ts | 7 +- .../interlinearizer.web-view.test.tsx | 122 +++-- .../paratext-9/paratext9Converter.test.ts | 431 +++++++++++++++ .../paratext9Parser.test.ts} | 228 ++++---- src/interlinearizer.web-view.tsx | 72 ++- src/parsers/paratext-9/paratext-9-types.ts | 64 +++ src/parsers/paratext-9/paratext9Converter.ts | 286 ++++++++++ .../paratext9Parser.ts} | 50 +- src/parsers/{ => paratext-9}/pt9-xml.md | 5 +- src/types/interlinearizer-enums.ts | 58 ++ src/types/interlinearizer.d.ts | 517 ++++++++++++++++-- tsconfig.json | 5 +- 14 files changed, 1617 insertions(+), 244 deletions(-) create mode 100644 src/__tests__/parsers/paratext-9/paratext9Converter.test.ts rename src/__tests__/parsers/{interlinearXmlParser.test.ts => paratext-9/paratext9Parser.test.ts} (78%) create mode 100644 src/parsers/paratext-9/paratext-9-types.ts create mode 100644 src/parsers/paratext-9/paratext9Converter.ts rename src/parsers/{interlinearXmlParser.ts => paratext-9/paratext9Parser.ts} (86%) rename src/parsers/{ => paratext-9}/pt9-xml.md (95%) create mode 100644 src/types/interlinearizer-enums.ts diff --git a/README.md 
b/README.md index ecc24ea..64ef32c 100644 --- a/README.md +++ b/README.md @@ -95,7 +95,8 @@ The general file structure for an extension is as follows: - `src/` contains the source code for the extension - `src/main.ts` is the main entry file for the extension (registers commands and wires interlinear XML) - `src/types/interlinearizer.d.ts` is this extension's types file that defines how other extensions can use this extension through the `papi`. It is copied into the build folder - - `src/parsers/interlinearXmlParser.ts` parses interlinear XML into structured data (uses fast-xml-parser). The PT9 XML schema and parsed output are documented in `src/parsers/pt9-xml.md` + - `src/types/` also holds shared enums and type modules (e.g. `interlinearizer-enums.ts`). Use the path alias `types/interlinearizer-enums` in imports instead of relative paths (see `tsconfig.json` paths). + - `src/parsers/` contains all parsers and converters used when importing external data models sorted by source (e.g. Paratext 9 XML Files). Use the path alias `parsers/...` in imports instead of relative paths (see `tsconfig.json` paths). 
- `*.web-view.tsx` files will be treated as React WebViews - `*.web-view.scss` files provide styles for WebViews - `*.web-view.html` files are a conventional way to provide HTML WebViews (no special functionality) diff --git a/cspell.json b/cspell.json index 8760a2f..4046bd8 100644 --- a/cspell.json +++ b/cspell.json @@ -16,7 +16,10 @@ "appdata", "asyncs", "autodocs", + "BCVWP", + "behaviour", "dockbox", + "Eflomal", "electronmon", "endregion", "finalizer", @@ -24,10 +27,14 @@ "guids", "hopkinson", "iframes", + "interlineardata", "interlinearization", + "interlinearizations", "interlinearizer", + "jsmith", "localstorage", "maximizable", + "Morphosyntactic", "networkable", "Newtonsoft", "nodebuffer", @@ -40,6 +47,7 @@ "pdps", "plusplus", "proxied", + "punc", "reinitializing", "reserialized", "sillsdev", @@ -47,15 +55,18 @@ "stringifiable", "Stylesheet", "typedefs", + "unanalyzed", "unregistering", "unregisters", + "unreviewed", "unsub", "unsubs", "unsubscriber", "unsubscribers", "usfm", "verseref", - "versification" + "versification", + "wordform" ], "ignoreWords": [], "import": [] diff --git a/jest.config.ts b/jest.config.ts index 2e43f5f..ef6987d 100644 --- a/jest.config.ts +++ b/jest.config.ts @@ -27,7 +27,7 @@ const config: Config = { 'src/parsers/**/*.ts', 'src/main.ts', 'src/**/*.web-view.tsx', - '!src/parsers/**/*.d.ts', + '!src/parsers/**/*-types.ts', '!src/**/__tests__/**', '!src/**/*.test.{ts,tsx}', '!src/**/*.spec.{ts,tsx}', @@ -70,11 +70,12 @@ const config: Config = { */ moduleNameMapper: { /** - * Resolve src-rooted path aliases so tests can use e.g. "@main" or "parsers/..." instead of - * relative paths. Must match tsconfig.json "paths" and webpack resolve.alias. + * Resolve src-rooted path aliases so tests can use e.g. "@main", "parsers/...", or "types/..." + * instead of relative paths. Must match tsconfig.json "paths" and webpack resolve.alias. 
*/ '^@main$': '/src/main', '^parsers/(.*)$': '/src/parsers/$1', + '^types/(.*)$': '/src/types/$1', '\\.(sa|sc|c)ss$': '/__mocks__/styleMock.ts', '\\.(jpg|jpeg|png|gif|eot|otf|webp|svg|ttf|woff|woff2|mp4|webm|wav|mp3|m4a|aac|oga)$': '/__mocks__/fileMock.ts', diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index f1a0d32..67cc843 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -4,18 +4,38 @@ import type { WebViewProps } from '@papi/core'; import type { SerializedVerseRef } from '@sillsdev/scripture'; -import { render, screen } from '@testing-library/react'; -import { InterlinearXmlParser } from 'parsers/interlinearXmlParser'; - -/** Mock parser to allow overriding constructor behavior per test. */ -jest.mock('parsers/interlinearXmlParser', () => { - const actual = jest.requireActual( - 'parsers/interlinearXmlParser', - ); - return { - InterlinearXmlParser: jest.fn().mockImplementation(() => new actual.InterlinearXmlParser()), - }; -}); +import { fireEvent, render, screen } from '@testing-library/react'; +import type { InterlinearData } from 'paratext-9-types'; + +/** Stub InterlinearData returned by the mocked parser. Matches shape the WebView displays. */ +const stubInterlinearData: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, +}; + +/** Stub Interlinearization returned by the mocked converter. Matches shape the WebView displays. */ +const stubInterlinearization = { + id: 'mock-interlinear-id', + sourceWritingSystem: '', + analysisLanguages: ['en'], + books: [{ id: 'mock-book-id', bookRef: 'MAT', textVersion: '', segments: [] }], +}; + +const mockParse = jest.fn().mockReturnValue(stubInterlinearData); +const mockConvert = jest.fn().mockReturnValue(stubInterlinearization); + +/** Mock parser: no real XML parsing; returns stub data. Parser/converter are tested elsewhere. 
*/ +jest.mock('parsers/paratext-9/paratext9Parser', () => ({ + Paratext9Parser: jest.fn().mockImplementation(() => ({ + parse: mockParse, + })), +})); + +/** Mock converter: no real conversion; returns stub Interlinearization. */ +jest.mock('parsers/paratext-9/paratext9Converter', () => ({ + convertParatext9ToInterlinearization: mockConvert, +})); /** * Load the WebView module; it assigns the component to globalThis.webViewComponent. This pattern is @@ -66,37 +86,41 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/test-data\/Interlinear_en_MAT\.xml/i)).toBeInTheDocument(); }); - it('parses the bundled test XML and displays parsed JSON', () => { + it('renders the JSON view mode switch (InterlinearData / Interlinearization)', () => { render(); - expect(screen.getByText(/parsed interlinear data \(json\)/i)).toBeInTheDocument(); - expect(screen.getByText(/"GlossLanguage"/)).toBeInTheDocument(); - expect(screen.getByText(/"BookId"/)).toBeInTheDocument(); + const group = screen.getByRole('group', { name: /json view mode/i }); + expect(group).toBeInTheDocument(); + expect(screen.getByRole('button', { name: /^interlineardata$/i })).toBeInTheDocument(); + expect(screen.getByRole('button', { name: /^interlinearization$/i })).toBeInTheDocument(); + expect(screen.getByText(/view json as:/i)).toBeInTheDocument(); }); - it('displays parsed structure with expected verse data', () => { + it('displays InterlinearData JSON by default when parser returns data', () => { + render(); + + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByText(/glossLanguage/i)).toBeInTheDocument(); + expect(screen.getByText(/bookId/i)).toBeInTheDocument(); + }); + + it('displays parsed structure including glossLanguage and bookId values', () => { render(); expect(screen.getByText(/"en"/)).toBeInTheDocument(); expect(screen.getByText(/"MAT"/)).toBeInTheDocument(); }); - it('does not show parse error when XML is valid', () => { + 
it('does not show parse error when parser succeeds', () => { render(); expect(screen.queryByText(/^parse error$/i)).not.toBeInTheDocument(); }); it('displays parse error when parser throws an Error (uses err.message)', () => { - const actual = jest.requireActual( - '../parsers/interlinearXmlParser', - ); - const realInstance = new actual.InterlinearXmlParser(); - const throwingParse = (): never => { + mockParse.mockImplementationOnce(() => { throw new Error('Invalid XML structure'); - }; - Object.defineProperty(realInstance, 'parse', { value: throwingParse, writable: true }); - jest.mocked(InterlinearXmlParser).mockImplementationOnce(() => realInstance); + }); render(); @@ -104,18 +128,48 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/invalid xml structure/i)).toBeInTheDocument(); }); + it('switching to Interlinearization shows converted model JSON', () => { + render(); + + fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); + expect(screen.getByText(/sourceWritingSystem/i)).toBeInTheDocument(); + expect(screen.getByText(/segments/i)).toBeInTheDocument(); + }); + + it('switching back to InterlinearData shows PT9 structure JSON', () => { + render(); + + fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + + fireEvent.click(screen.getByRole('button', { name: /^interlineardata$/i })); + + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByText(/glossLanguage/i)).toBeInTheDocument(); + expect(screen.getByText(/bookId/i)).toBeInTheDocument(); + }); + + it('renders empty JSON pre when jsonToShow is undefined (converter returns undefined)', () => { + mockConvert.mockReturnValueOnce(undefined); + + const { container 
} = render(); + fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + + const jsonPre = container.querySelector('pre'); + expect(jsonPre).toBeInTheDocument(); + expect(jsonPre).toBeEmptyDOMElement(); + expect(jsonPre).not.toHaveTextContent('undefined'); + }); + it('displays parse error when parser throws non-Error (uses String(err))', () => { - const actual = jest.requireActual( - '../parsers/interlinearXmlParser', - ); - const realInstance = new actual.InterlinearXmlParser(); - const throwingParse = (): never => { + mockParse.mockImplementationOnce(() => { // Intentionally throw a non-Error to test the String(err) branch in the catch block. // eslint-disable-next-line no-throw-literal -- testing non-Error handling throw 'plain string error'; - }; - Object.defineProperty(realInstance, 'parse', { value: throwingParse, writable: true }); - jest.mocked(InterlinearXmlParser).mockImplementationOnce(() => realInstance); + }); render(); diff --git a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts new file mode 100644 index 0000000..7a86cdf --- /dev/null +++ b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts @@ -0,0 +1,431 @@ +/** @file Unit tests for {@link convertParatext9ToInterlinearization}. 
*/ +/// + +import type { InterlinearData } from 'paratext-9-types'; +import { convertParatext9ToInterlinearization } from 'parsers/paratext-9/paratext9Converter'; + +describe('convertParatext9ToInterlinearization', () => { + describe('top-level structure', () => { + it('produces Interlinearization with id, sourceWritingSystem, analysisLanguages, books', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result).toHaveProperty('id'); + expect(result).toHaveProperty('sourceWritingSystem', ''); + expect(result).toHaveProperty('analysisLanguages'); + expect(Array.isArray(result.analysisLanguages)).toBe(true); + expect(result).toHaveProperty('books'); + expect(Array.isArray(result.books)).toBe(true); + }); + + it('uses bookId for interlinearization id (lowercase, spaces to dashes)', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'RUT', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.id).toBe('rut-interlinear'); + }); + + it('produces id mat-interlinear when bookId is MAT', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.id).toBe('mat-interlinear'); + }); + + it('sets analysisLanguages from glossLanguage', () => { + const data: InterlinearData = { + glossLanguage: 'fr', + bookId: 'GEN', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.analysisLanguages).toEqual(['fr']); + }); + + it('produces exactly one AnalyzedBook with id, bookRef, textVersion, segments', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books).toHaveLength(1); + const book = result.books[0]; + 
expect(book).toHaveProperty('id', 'mat'); + expect(book).toHaveProperty('bookRef', 'MAT'); + expect(book).toHaveProperty('textVersion'); + expect(book).toHaveProperty('segments'); + expect(Array.isArray(book.segments)).toBe(true); + }); + }); + + describe('empty verses', () => { + it('returns empty segments array and empty textVersion when verses is empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments).toEqual([]); + expect(result.books[0].textVersion).toBe(''); + }); + }); + + describe('verse to segment conversion', () => { + it('converts one verse with one cluster to one segment with one word occurrence', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:word', senseId: 'sense1' }], + lexemesId: 'Word:word', + id: 'Word:word/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments).toHaveLength(1); + const seg = result.books[0].segments[0]; + expect(seg.id).toBe('mat-1:1'); + expect(seg.segmentRef).toBe('MAT 1:1'); + expect(seg.baselineText).toBe(''); + expect(seg.occurrences).toHaveLength(1); + + const occ = seg.occurrences[0]; + expect(occ.id).toBe('mat-1:1-occ-0-Word:word/0-4'); + expect(occ.segmentId).toBe('mat-1:1'); + expect(occ.index).toBe(0); + expect(occ.anchor).toBe('0-4'); + expect(occ.surfaceText).toBe(''); + expect(occ.writingSystem).toBe(''); + expect(occ.type).toBe('word'); + expect(occ.assignments).toHaveLength(1); + + const assign = occ.assignments[0]; + expect(assign.occurrenceId).toBe(occ.id); + expect(assign.analysisId).toBe('analysis-en-Word:word-sense1'); + expect(assign.status).toBe('suggested'); + 
expect(assign.id).toBe(`assign-${occ.id}-analysis-en-Word:word-sense1`); + }); + + it('uses verse hash for textVersion and sets assignment status to approved when verse has hash', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: 'ABC123', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:word', senseId: 's1' }], + lexemesId: 'Word:word', + id: 'Word:word/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].textVersion).toBe('ABC123'); + expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('approved'); + }); + }); + + describe('assignment status from verse hash', () => { + it('sets assignment status to suggested when verse has no hash', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:w', senseId: '' }], + lexemesId: 'Word:w', + id: 'Word:w/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('suggested'); + }); + + it('sets assignment status to approved when verse has hash', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: 'H1', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:w', senseId: '' }], + lexemesId: 'Word:w', + id: 'Word:w/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('approved'); + }); + }); + + describe('cluster with multiple lexemes', () => { + 
it('creates one word occurrence with multiple assignments (one per lexeme)', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 5, length: 5 }, + lexemes: [ + { lexemeId: 'Stem:hello', senseId: 'g1' }, + { lexemeId: 'Suffix:ing', senseId: 'g2' }, + ], + lexemesId: 'Stem:hello/Suffix:ing', + id: 'Stem:hello/Suffix:ing/5-5', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + const occ = result.books[0].segments[0].occurrences[0]; + expect(occ.assignments).toHaveLength(2); + expect(occ.assignments.map((a) => a.analysisId)).toEqual([ + 'analysis-en-Stem:hello-g1', + 'analysis-en-Suffix:ing-g2', + ]); + expect(occ.anchor).toBe('5-5'); + }); + }); + + describe('punctuation occurrences', () => { + it('converts punctuations to punctuation occurrences after word occurrences (surfaceText from afterText when present)', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 1 }, + lexemes: [{ lexemeId: 'x', senseId: '' }], + lexemesId: 'x', + id: 'x/0-1', + excluded: false, + }, + ], + punctuations: [ + { + textRange: { index: 34, length: 2 }, + beforeText: '? ', + afterText: '? ', + }, + ], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + const seg = result.books[0].segments[0]; + expect(seg.occurrences).toHaveLength(2); + + const puncOcc = seg.occurrences[1]; + expect(puncOcc.type).toBe('punctuation'); + expect(puncOcc.anchor).toBe('34-2'); + expect(puncOcc.surfaceText).toBe('? 
'); // afterText preferred in implementation + expect(puncOcc.assignments).toEqual([]); + expect(puncOcc.index).toBe(1); + expect(puncOcc.id).toBe('mat-1:1-punc-1-34-2'); + }); + + it('uses beforeText for surfaceText when afterText is empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [], + punctuations: [{ textRange: { index: 0, length: 1 }, beforeText: ',', afterText: '' }], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].occurrences[0].surfaceText).toBe(','); + }); + + it('uses empty surfaceText when both beforeText and afterText are empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [], + punctuations: [{ textRange: { index: 0, length: 1 }, beforeText: '', afterText: '' }], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].occurrences[0].surfaceText).toBe(''); + }); + }); + + describe('verse with no clusters', () => { + it('produces segment with empty occurrences when verse has no clusters and no punctuations', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments).toHaveLength(1); + expect(result.books[0].segments[0].occurrences).toEqual([]); + expect(result.books[0].segments[0].id).toBe('mat-1:1'); + expect(result.books[0].segments[0].segmentRef).toBe('MAT 1:1'); + }); + }); + + describe('lexeme without senseId', () => { + it('generates analysis id without sense suffix when senseId is empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: 
{ index: 0, length: 1 }, + lexemes: [{ lexemeId: 'Word:a', senseId: '' }], + lexemesId: 'Word:a', + id: 'Word:a/0-1', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].occurrences[0].assignments[0].analysisId).toBe( + 'analysis-en-Word:a', + ); + }); + }); + + describe('segment and occurrence IDs', () => { + it('generates segment id from verseRef (lowercase, spaces to dashes)', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'W:w', senseId: '' }], + lexemesId: 'W:w', + id: 'W:w/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + expect(result.books[0].segments[0].id).toBe('mat-1:1'); + }); + + it('generates occurrence id from segmentId, cluster id, and index', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:word', senseId: 's1' }], + lexemesId: 'Word:word', + id: 'Word:word/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = convertParatext9ToInterlinearization(data); + + const segId = result.books[0].segments[0].id; + expect(result.books[0].segments[0].occurrences[0].id).toBe(`${segId}-occ-0-Word:word/0-4`); + }); + }); +}); diff --git a/src/__tests__/parsers/interlinearXmlParser.test.ts b/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts similarity index 78% rename from src/__tests__/parsers/interlinearXmlParser.test.ts rename to src/__tests__/parsers/paratext-9/paratext9Parser.test.ts index 875789f..eed880b 100644 --- a/src/__tests__/parsers/interlinearXmlParser.test.ts +++ 
b/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts @@ -1,16 +1,16 @@ -/** @file Unit tests for {@link InterlinearXmlParser}. */ +/** @file Unit tests for {@link Paratext9Parser}. */ /// import * as fs from 'fs'; import * as path from 'path'; -import { InterlinearXmlParser } from 'parsers/interlinearXmlParser'; +import { Paratext9Parser } from 'parsers/paratext-9/paratext9Parser'; -describe('InterlinearXmlParser', () => { - let parser: InterlinearXmlParser; +describe('Paratext9Parser', () => { + let parser: Paratext9Parser; beforeEach(() => { - parser = new InterlinearXmlParser(); + parser = new Paratext9Parser(); }); describe('parse() - valid XML', () => { @@ -33,30 +33,29 @@ describe('InterlinearXmlParser', () => { const result = parser.parse(xml); expect(result).toEqual({ - ScrTextName: '', - GlossLanguage: 'en', - BookId: 'MAT', - Verses: { + glossLanguage: 'en', + bookId: 'MAT', + verses: { 'MAT 1:1': { - Hash: '', - Clusters: [ + hash: '', + clusters: [ { - TextRange: { Index: 0, Length: 4 }, - Lexemes: [{ LexemeId: 'Word:word', SenseId: 'sense1' }], - LexemesId: 'Word:word', - Id: 'Word:word/0-4', - Excluded: false, + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:word', senseId: 'sense1' }], + lexemesId: 'Word:word', + id: 'Word:word/0-4', + excluded: false, }, ], - Punctuations: [], + punctuations: [], }, }, }); }); - it('parses optional ScrTextName and verse Hash', () => { + it('parses verse Hash', () => { const xml = ` - + RUT 3:1 @@ -72,13 +71,12 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.ScrTextName).toBe('MyProject'); - expect(result.Verses['RUT 3:1'].Hash).toBe('ABC123'); + expect(result.verses['RUT 3:1'].hash).toBe('ABC123'); }); it('parses purely numeric verse Hash', () => { const xml = ` - + RUT 3:1 @@ -94,8 +92,7 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.ScrTextName).toBe('MyProject'); - expect(result.Verses['RUT 
3:1'].Hash).toBe('123456'); + expect(result.verses['RUT 3:1'].hash).toBe('123456'); }); it('parses cluster with multiple lexemes and builds LexemesId and Id correctly', () => { @@ -117,13 +114,13 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - const cluster = result.Verses['MAT 1:1'].Clusters[0]; - expect(cluster.Lexemes).toEqual([ - { LexemeId: 'Stem:hello', SenseId: 'g1' }, - { LexemeId: 'Suffix:ing', SenseId: 'g2' }, + const cluster = result.verses['MAT 1:1'].clusters[0]; + expect(cluster.lexemes).toEqual([ + { lexemeId: 'Stem:hello', senseId: 'g1' }, + { lexemeId: 'Suffix:ing', senseId: 'g2' }, ]); - expect(cluster.LexemesId).toBe('Stem:hello/Suffix:ing'); - expect(cluster.Id).toBe('Stem:hello/Suffix:ing/5-5'); + expect(cluster.lexemesId).toBe('Stem:hello/Suffix:ing'); + expect(cluster.id).toBe('Stem:hello/Suffix:ing/5-5'); }); it('parses lexeme Id containing slash: LexemesId and Id preserve the slash (slash-safe)', () => { @@ -144,10 +141,10 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - const cluster = result.Verses['MAT 1:1'].Clusters[0]; - expect(cluster.Lexemes).toEqual([{ LexemeId: 'Word:hello/world', SenseId: 'g1' }]); - expect(cluster.LexemesId).toBe('Word:hello/world'); - expect(cluster.Id).toBe('Word:hello/world/0-12'); + const cluster = result.verses['MAT 1:1'].clusters[0]; + expect(cluster.lexemes).toEqual([{ lexemeId: 'Word:hello/world', senseId: 'g1' }]); + expect(cluster.lexemesId).toBe('Word:hello/world'); + expect(cluster.id).toBe('Word:hello/world/0-12'); }); it('preserves slash when joining Lexeme Ids (multiple lexemes, one Id contains slash)', () => { @@ -169,13 +166,13 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - const cluster = result.Verses['MAT 1:1'].Clusters[0]; - expect(cluster.Lexemes).toEqual([ - { LexemeId: 'Stem:foo/bar', SenseId: 'g1' }, - { LexemeId: 'Suffix:ing', SenseId: 'g2' }, + const cluster = result.verses['MAT 
1:1'].clusters[0]; + expect(cluster.lexemes).toEqual([ + { lexemeId: 'Stem:foo/bar', senseId: 'g1' }, + { lexemeId: 'Suffix:ing', senseId: 'g2' }, ]); - expect(cluster.LexemesId).toBe('Stem:foo/bar/Suffix:ing'); - expect(cluster.Id).toBe('Stem:foo/bar/Suffix:ing/5-11'); + expect(cluster.lexemesId).toBe('Stem:foo/bar/Suffix:ing'); + expect(cluster.id).toBe('Stem:foo/bar/Suffix:ing/5-11'); }); it('parses cluster with no lexemes: Id is Index-Length only (no leading slash)', () => { @@ -195,10 +192,10 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - const cluster = result.Verses['MAT 1:1'].Clusters[0]; - expect(cluster.Lexemes).toEqual([]); - expect(cluster.LexemesId).toBe(''); - expect(cluster.Id).toBe('10-3'); + const cluster = result.verses['MAT 1:1'].clusters[0]; + expect(cluster.lexemes).toEqual([]); + expect(cluster.lexemesId).toBe(''); + expect(cluster.id).toBe('10-3'); }); it('parses Lexeme without GlossId as empty SenseId', () => { @@ -219,9 +216,9 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Clusters[0].Lexemes[0]).toEqual({ - LexemeId: 'Word:a', - SenseId: '', + expect(result.verses['MAT 1:1'].clusters[0].lexemes[0]).toEqual({ + lexemeId: 'Word:a', + senseId: '', }); }); @@ -244,7 +241,7 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Clusters[0].Excluded).toBe(true); + expect(result.verses['MAT 1:1'].clusters[0].excluded).toBe(true); }); it('parses Cluster with Excluded=false', () => { @@ -266,7 +263,7 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Clusters[0].Excluded).toBe(false); + expect(result.verses['MAT 1:1'].clusters[0].excluded).toBe(false); }); it('parses Cluster without Excluded as Excluded=false', () => { @@ -287,7 +284,7 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - 
expect(result.Verses['MAT 1:1'].Clusters[0].Excluded).toBe(false); + expect(result.verses['MAT 1:1'].clusters[0].excluded).toBe(false); }); it('parses Punctuation with Range, BeforeText, AfterText', () => { @@ -314,11 +311,11 @@ describe('InterlinearXmlParser', () => { const result = parser.parse(xml); // Parser uses trimValues: false, so tag text is not trimmed. - expect(result.Verses['MAT 1:1'].Punctuations).toEqual([ + expect(result.verses['MAT 1:1'].punctuations).toEqual([ { - TextRange: { Index: 34, Length: 2 }, - BeforeText: '? ', - AfterText: '? ', + textRange: { index: 34, length: 2 }, + beforeText: '? ', + afterText: '? ', }, ]); }); @@ -350,11 +347,11 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Punctuations).toHaveLength(1); - expect(result.Verses['MAT 1:1'].Punctuations[0]).toEqual({ - TextRange: { Index: 1, Length: 2 }, - BeforeText: 'c', - AfterText: 'd', + expect(result.verses['MAT 1:1'].punctuations).toHaveLength(1); + expect(result.verses['MAT 1:1'].punctuations[0]).toEqual({ + textRange: { index: 1, length: 2 }, + beforeText: 'c', + afterText: 'd', }); }); @@ -396,11 +393,11 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Punctuations).toHaveLength(1); - expect(result.Verses['MAT 1:1'].Punctuations[0]).toEqual({ - TextRange: { Index: 5, Length: 1 }, - BeforeText: 'valid', - AfterText: '', + expect(result.verses['MAT 1:1'].punctuations).toHaveLength(1); + expect(result.verses['MAT 1:1'].punctuations[0]).toEqual({ + textRange: { index: 5, length: 1 }, + beforeText: 'valid', + afterText: '', }); }); @@ -425,11 +422,11 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Punctuations).toHaveLength(1); - expect(result.Verses['MAT 1:1'].Punctuations[0]).toEqual({ - TextRange: { Index: 10, Length: 1 }, - BeforeText: '', - AfterText: '', + 
expect(result.verses['MAT 1:1'].punctuations).toHaveLength(1); + expect(result.verses['MAT 1:1'].punctuations[0]).toEqual({ + textRange: { index: 10, length: 1 }, + beforeText: '', + afterText: '', }); }); @@ -460,9 +457,9 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(Object.keys(result.Verses)).toEqual(['MAT 1:1', 'MAT 1:2']); - expect(result.Verses['MAT 1:1'].Clusters[0].Lexemes[0].LexemeId).toBe('a'); - expect(result.Verses['MAT 1:2'].Clusters[0].Lexemes[0].LexemeId).toBe('b'); + expect(Object.keys(result.verses)).toEqual(['MAT 1:1', 'MAT 1:2']); + expect(result.verses['MAT 1:1'].clusters[0].lexemes[0].lexemeId).toBe('a'); + expect(result.verses['MAT 1:2'].clusters[0].lexemes[0].lexemeId).toBe('b'); }); it('parses item with missing VerseData as empty Hash, Clusters, Punctuations', () => { @@ -477,10 +474,10 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1']).toEqual({ - Hash: '', - Clusters: [], - Punctuations: [], + expect(result.verses['MAT 1:1']).toEqual({ + hash: '', + clusters: [], + punctuations: [], }); }); @@ -497,10 +494,10 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:11']).toEqual({ - Hash: '', - Clusters: [], - Punctuations: [], + expect(result.verses['MAT 1:11']).toEqual({ + hash: '', + clusters: [], + punctuations: [], }); }); @@ -523,12 +520,12 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses['MAT 1:1'].Clusters).toEqual([]); - expect(result.Verses['MAT 1:1'].Punctuations).toHaveLength(1); - expect(result.Verses['MAT 1:1'].Punctuations[0]).toEqual({ - TextRange: { Index: 0, Length: 1 }, - BeforeText: ',', - AfterText: ',', + expect(result.verses['MAT 1:1'].clusters).toEqual([]); + expect(result.verses['MAT 1:1'].punctuations).toHaveLength(1); + expect(result.verses['MAT 1:1'].punctuations[0]).toEqual({ + textRange: { index: 
0, length: 1 }, + beforeText: ',', + afterText: ',', }); }); @@ -542,9 +539,9 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(result.Verses).toEqual({}); - expect(result.GlossLanguage).toBe('en'); - expect(result.BookId).toBe('MAT'); + expect(result.verses).toEqual({}); + expect(result.glossLanguage).toBe('en'); + expect(result.bookId).toBe('MAT'); }); it('skips items with missing string (verse key)', () => { @@ -573,40 +570,47 @@ describe('InterlinearXmlParser', () => { `; const result = parser.parse(xml); - expect(Object.keys(result.Verses)).toEqual(['MAT 1:1']); - expect(result.Verses['MAT 1:1'].Clusters[0].Lexemes[0].LexemeId).toBe('y'); + expect(Object.keys(result.verses)).toEqual(['MAT 1:1']); + expect(result.verses['MAT 1:1'].clusters[0].lexemes[0].lexemeId).toBe('y'); }); it('parses real test-data file without throwing', () => { - const xmlPath = path.join(__dirname, '..', '..', '..', 'test-data', 'Interlinear_en_MAT.xml'); + const xmlPath = path.join( + __dirname, + '..', + '..', + '..', + '..', + 'test-data', + 'Interlinear_en_MAT.xml', + ); const xml = fs.readFileSync(xmlPath, 'utf-8'); const result = parser.parse(xml); - expect(result.GlossLanguage).toBe('en'); - expect(result.BookId).toBe('MAT'); - expect(result.ScrTextName).toBe(''); - expect(Object.keys(result.Verses).length).toBeGreaterThan(0); + expect(result.glossLanguage).toBe('en'); + expect(result.bookId).toBe('MAT'); + expect(Object.keys(result.verses).length).toBeGreaterThan(0); - const mat11 = result.Verses['MAT 1:1']; + const mat11 = result.verses['MAT 1:1']; expect(mat11).toBeDefined(); - expect(mat11.Hash).toBe('C8D38188'); - expect(mat11.Clusters.length).toBeGreaterThan(0); - const firstCluster = mat11.Clusters[0]; - expect(firstCluster.TextRange).toEqual({ Index: 5, Length: 5 }); - expect(firstCluster.Lexemes[0]).toEqual({ - LexemeId: 'Word:hello', - SenseId: 'WvbPwa9D', + expect(mat11.hash).toBe('C8D38188'); + 
expect(mat11.clusters.length).toBeGreaterThan(0); + const firstCluster = mat11.clusters[0]; + expect(firstCluster.textRange).toEqual({ index: 5, length: 5 }); + expect(firstCluster.lexemes[0]).toEqual({ + lexemeId: 'Word:hello', + senseId: 'WvbPwa9D', }); - expect(firstCluster.Id).toMatch(/^Word:hello\/5-5$/); + expect(firstCluster.id).toMatch(/^Word:hello\/5-5$/); - const versesWithPunctuation = Object.values(result.Verses).filter( - (v) => v.Punctuations.length > 0, + const versesWithPunctuation = Object.values(result.verses).filter( + (v) => v.punctuations.length > 0, ); expect(versesWithPunctuation.length).toBeGreaterThan(0); const [firstWithPunctuation] = versesWithPunctuation; - expect(firstWithPunctuation.Punctuations[0]).toHaveProperty('TextRange'); - expect(firstWithPunctuation.Punctuations[0]).toHaveProperty('BeforeText'); - expect(firstWithPunctuation.Punctuations[0]).toHaveProperty('AfterText'); + expect(firstWithPunctuation.punctuations[0]).toHaveProperty('textRange'); + expect(firstWithPunctuation.punctuations[0]).toHaveProperty('beforeText'); + expect(firstWithPunctuation.punctuations[0]).toHaveProperty('afterText'); }); }); @@ -802,8 +806,8 @@ describe('InterlinearXmlParser', () => { describe('constructor and instance', () => { it('can be instantiated multiple times', () => { - const p1 = new InterlinearXmlParser(); - const p2 = new InterlinearXmlParser(); + const p1 = new Paratext9Parser(); + const p2 = new Paratext9Parser(); const xml = ` diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index f47bd69..4d1a14d 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -1,6 +1,7 @@ -import { useMemo } from 'react'; -import type { InterlinearData } from 'interlinearizer'; -import { InterlinearXmlParser } from './parsers/interlinearXmlParser'; +import { useMemo, useState } from 'react'; +import type { InterlinearData } from 'paratext-9-types'; +import { Paratext9Parser } from 
'./parsers/paratext-9/paratext9Parser'; +import { convertParatext9ToInterlinearization } from './parsers/paratext-9/paratext9Converter'; /** Test interlinear XML bundled at build time (from test-data/Interlinear_en_MAT.xml). */ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; @@ -8,15 +9,22 @@ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; /** Result of parsing the bundled test XML: either data or an error message. */ type ParseResult = { data: InterlinearData; error: undefined } | { data: undefined; error: string }; +/** View mode for the JSON display: raw PT9 structure or converted interlinearizer model. */ +type JsonViewMode = 'interlinear-data' | 'interlinearization'; + /** * Main interlinearizer WebView. Parses the bundled test XML into the interlinear model and displays * the result as raw JSON. No PAPI commands or file loading—everything is self-contained. * - * Parser is created inside useMemo so parsing runs once per mount. + * A switch lets the user choose between viewing {@link InterlinearData} (Paratext 9 format) or + * {@link Interlinearization} (converted interlinearizer model). Parser is created inside useMemo so + * parsing runs once per mount. */ globalThis.webViewComponent = function InterlinearizerWebView() { + const [jsonViewMode, setJsonViewMode] = useState('interlinear-data'); + const { data: parsed, error: parseError } = useMemo((): ParseResult => { - const parser = new InterlinearXmlParser(); + const parser = new Paratext9Parser(); try { const data = parser.parse(testXml); return { data, error: undefined }; @@ -25,6 +33,14 @@ globalThis.webViewComponent = function InterlinearizerWebView() { } }, []); + const interlinearization = useMemo( + () => (parsed ? convertParatext9ToInterlinearization(parsed) : undefined), + [parsed], + ); + + /** In Interlinearization mode use converted data (may be undefined); otherwise use parsed. */ + const jsonToShow = jsonViewMode === 'interlinearization' ? 
interlinearization : parsed; + return (

Interlinearizer

@@ -43,9 +59,51 @@ globalThis.webViewComponent = function InterlinearizerWebView() { {parsed && ( <> -

Parsed interlinear data (JSON):

+
+ View JSON as: +
+ + +
+

+ {jsonViewMode === 'interlinear-data' + ? 'Paratext 9 book/verse/cluster structure.' + : 'Converted interlinearizer book/segment/occurrence model.'} +

+
+

+ {jsonViewMode === 'interlinear-data' + ? 'InterlinearData (JSON):' + : 'Interlinearization (JSON):'} +

-            {JSON.stringify(parsed, undefined, 2)}
+            {jsonToShow ? JSON.stringify(jsonToShow, undefined, 2) : ''}
           
)} diff --git a/src/parsers/paratext-9/paratext-9-types.ts b/src/parsers/paratext-9/paratext-9-types.ts new file mode 100644 index 0000000..263bbd7 --- /dev/null +++ b/src/parsers/paratext-9/paratext-9-types.ts @@ -0,0 +1,64 @@ +declare module 'paratext-9-types' { + /** Character range in source text (Index, Length). */ + export interface StringRange { + /** Start index of the range in the source text (0-based). */ + index: number; + /** Number of characters in the range. */ + length: number; + } + + /** Data on the interlinearization of a single lexeme. */ + export interface LexemeData { + /** ID of the lexeme (e.g. from Lexicon; XML attribute Id). */ + lexemeId: string; + /** ID of the sense/gloss used for this lexeme (XML attribute GlossId). */ + senseId: string; + } + + /** Data on the interlinearization of a cluster. */ + export interface ClusterData { + /** Character range this cluster occupies in the verse text. */ + textRange: StringRange; + /** Lexemes in this cluster, in order. */ + lexemes: LexemeData[]; + /** Slash-joined LexemeIds for this cluster (e.g. "Word:a/Word:b"). */ + lexemesId: string; + /** Unique cluster id: LexemesId plus TextRange (e.g. "Word:a/Word:b/21-3"). */ + id: string; + /** Excluded flag. See [pt9-xml.md](../parsers/pt9-xml.md) for details. */ + excluded: boolean; + } + + /** Data on punctuation change. */ + export interface PunctuationData { + /** Character range this punctuation occupies in the verse text. */ + textRange: StringRange; + /** Punctuation text before the change (or empty). */ + beforeText: string; + /** Punctuation text after the change (or empty). */ + afterText: string; + } + + /** Interlinear data for a single verse. */ + export interface VerseData { + /** Hash of verse text when approved; empty string if not approved. */ + hash: string; + /** Lexeme clusters in this verse. */ + clusters: ClusterData[]; + /** Punctuation changes in this verse. 
*/ + punctuations: PunctuationData[]; + } + + /** Root interlinear data: book + verses. */ + export interface InterlinearData { + /** Language code or name for the glosses. */ + glossLanguage: string; + /** Book id (e.g. "RUT", "MAT"). */ + bookId: string; + /** + * Verse data keyed by verse reference (e.g. "RUT 3:1"). Exactly one entry per reference; the + * parser rejects XML that contains duplicate verse references. + */ + verses: Record; + } +} diff --git a/src/parsers/paratext-9/paratext9Converter.ts b/src/parsers/paratext-9/paratext9Converter.ts new file mode 100644 index 0000000..ea8d010 --- /dev/null +++ b/src/parsers/paratext-9/paratext9Converter.ts @@ -0,0 +1,286 @@ +/** + * @file Converts Paratext 9 interlinear data structures to the interlinearizer model. + * + * This module converts from {@link InterlinearData} (paratext-9-types) to {@link Interlinearization} + * (interlinearizer types), mapping Paratext 9's verse/cluster/lexeme structure to the + * interlinearizer's book/segment/occurrence/analysis structure. + */ + +import type { InterlinearData, VerseData, StringRange } from 'paratext-9-types'; +import type { + Interlinearization, + AnalyzedBook, + Segment, + Analysis, + Occurrence, + AnalysisAssignment, +} from 'interlinearizer'; +import { + OccurrenceType, + AnalysisType, + AssignmentStatus, + Confidence, +} from 'types/interlinearizer-enums'; + +/** + * Generates a deterministic ID for an interlinearization from Paratext 9 data. + * + * @param bookId - Book ID from InterlinearData. + * @returns A unique ID for the interlinearization. + */ +function generateInterlinearizationId(bookId: string): string { + return `${bookId}-interlinear`.toLowerCase().replace(/\s+/g, '-'); +} + +/** + * Generates a deterministic ID for an analyzed book. + * + * @param bookId - Book ID. + * @returns A unique ID for the book. 
+ */ +function generateBookId(bookId: string): string { + return bookId.toLowerCase().replace(/\s+/g, '-'); +} + +/** + * Generates a deterministic ID for a segment (verse). + * + * @param bookId - Book ID. + * @param verseRef - Verse reference (e.g., "MAT 1:1"). + * @returns A unique ID for the segment. + */ +function generateSegmentId(verseRef: string): string { + return verseRef.toLowerCase().replace(/\s+/g, '-'); +} + +/** + * Generates a deterministic ID for an occurrence from a cluster. + * + * @param segmentId - Parent segment ID. + * @param clusterId - Cluster ID from ClusterData. + * @param index - Zero-based index within the segment. + * @returns A unique ID for the occurrence. + */ +function generateOccurrenceIdFromCluster( + segmentId: string, + clusterId: string, + index: number, +): string { + return `${segmentId}-occ-${index}-${clusterId}`; +} + +/** + * Generates a deterministic ID for an occurrence from punctuation. + * + * @param segmentId - Parent segment ID. + * @param textRange - Text range of the punctuation. + * @param index - Zero-based index within the segment. + * @returns A unique ID for the occurrence. + */ +function generateOccurrenceIdFromPunctuation( + segmentId: string, + textRange: StringRange, + index: number, +): string { + return `${segmentId}-punc-${index}-${textRange.index}-${textRange.length}`; +} + +/** + * Generates a deterministic ID for an analysis from lexeme data. + * + * @param lexemeId - Lexeme ID. + * @param senseId - Sense/gloss ID. + * @param glossLanguage - Gloss language code. + * @returns A unique ID for the analysis. + */ +function generateAnalysisId(lexemeId: string, senseId: string, glossLanguage: string): string { + const sensePart = senseId ? `-${senseId}` : ''; + return `analysis-${glossLanguage}-${lexemeId}${sensePart}`; +} + +/** + * Generates a deterministic ID for an analysis assignment. + * + * @param occurrenceId - Occurrence ID. + * @param analysisId - Analysis ID. 
+ * @returns A unique ID for the assignment. + */ +function generateAssignmentId(occurrenceId: string, analysisId: string): string { + return `assign-${occurrenceId}-${analysisId}`; +} + +/** + * Converts a text range to an anchor string. + * + * @param textRange - Character range in source text. + * @returns Anchor string in format "index-length". + */ +function textRangeToAnchor(textRange: StringRange): string { + return `${textRange.index}-${textRange.length}`; +} + +/** + * Converts a Paratext 9 verse to an interlinearizer segment. + * + * @param verseRef - Verse reference (e.g., "MAT 1:1"). + * @param verseData - Verse data from Paratext 9. + * @param bookId - Book ID for generating segment ID. + * @param glossLanguage - Gloss language code. + * @returns A Segment with occurrences converted from clusters and punctuations. + */ +function convertVerseToSegment( + verseRef: string, + verseData: VerseData, + glossLanguage: string, +): Segment { + const segmentId = generateSegmentId(verseRef); + + const wordOccurrences = verseData.clusters.map((cluster, clusterIndex): Occurrence => { + const assignments = cluster.lexemes.map((lexeme): AnalysisAssignment => { + const analysisId = generateAnalysisId(lexeme.lexemeId, lexeme.senseId, glossLanguage); + const assignmentId = generateAssignmentId( + generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex), + analysisId, + ); + + return { + id: assignmentId, + occurrenceId: generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex), + analysisId, + status: verseData.hash ? 
AssignmentStatus.Approved : AssignmentStatus.Suggested, + }; + }); + + const occurrenceId = generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex); + + return { + id: occurrenceId, + segmentId, + index: clusterIndex, + anchor: textRangeToAnchor(cluster.textRange), + surfaceText: '', // Paratext 9 doesn't specify surface text per cluster + writingSystem: '', // Paratext 9 doesn't specify writing system per cluster + type: OccurrenceType.Word, + assignments, + }; + }); + + const punctuationOccurrences: Occurrence[] = verseData.punctuations.map( + (punctuation, puncIndex): Occurrence => { + const occurrenceIndex = wordOccurrences.length + puncIndex; + + return { + id: generateOccurrenceIdFromPunctuation(segmentId, punctuation.textRange, occurrenceIndex), + segmentId, + index: occurrenceIndex, + anchor: textRangeToAnchor(punctuation.textRange), + surfaceText: punctuation.afterText || punctuation.beforeText || '', + writingSystem: '', + type: OccurrenceType.Punctuation, + assignments: [], + }; + }, + ); + + const occurrences = [...wordOccurrences, ...punctuationOccurrences]; + + return { + id: segmentId, + segmentRef: verseRef, + baselineText: '', // Paratext 9 doesn't specify baseline text + occurrences, + }; +} + +/** + * Creates Analysis objects for all unique lexemes across all verses. + * + * @param interlinearData - Paratext 9 interlinear data. + * @returns Map of analysis ID to Analysis object. 
+ */ +function createAnalyses(interlinearData: InterlinearData): Map { + const analyses = new Map(); + const { glossLanguage } = interlinearData; + + // Collect all unique lexeme-sense pairs + Object.values(interlinearData.verses).forEach((verseData) => { + verseData.clusters.forEach((cluster) => { + cluster.lexemes.forEach((lexeme) => { + const analysisId = generateAnalysisId(lexeme.lexemeId, lexeme.senseId, glossLanguage); + + if (!analyses.has(analysisId)) { + const analysis: Analysis = { + id: analysisId, + analysisLanguage: glossLanguage, + analysisType: AnalysisType.Gloss, // Paratext 9 provides word-level glosses + confidence: Confidence.Medium, // Default confidence level + sourceSystem: 'paratext-9', + sourceUser: 'paratext-9-parser', + glossText: lexeme.senseId || undefined, // Use senseId as gloss text placeholder + // Note: Paratext 9 doesn't provide POS, features, or morpheme bundles in the XML + }; + + analyses.set(analysisId, analysis); + } + }); + }); + }); + + return analyses; +} + +/** + * Converts Paratext 9 InterlinearData to interlinearizer Interlinearization. + * + * This function performs the following mappings: + * + * - InterlinearData → Interlinearization (one per book) + * - VerseData → Segment (one per verse) + * - ClusterData → Occurrence (word type) with AnalysisAssignments + * - PunctuationData → Occurrence (punctuation type) + * - LexemeData → Analysis + AnalysisAssignment + * + * Note: Analysis objects are created but not directly attached to the Interlinearization. They are + * referenced via AnalysisAssignment.analysisId. In a full implementation, you might want to store + * them in a separate collection or attach them to a parent structure. + * + * @param interlinearData - Paratext 9 interlinear data to convert. + * @param baselineTexts - Optional map of verse references to baseline text (for extracting + * surfaceText). If not provided, surfaceText will be empty strings. + * @returns Converted Interlinearization object. 
+ */ +export function convertParatext9ToInterlinearization( + interlinearData: InterlinearData, +): Interlinearization { + const { glossLanguage, bookId, verses } = interlinearData; + + const interlinearizationId = generateInterlinearizationId(bookId); + const analyzedBookId = generateBookId(bookId); + + // Note: analyses are created but not returned - they're referenced via analysisId in assignments + createAnalyses(interlinearData); + + const segments = Object.entries(verses).map(([verseRef, verseData]) => { + return convertVerseToSegment(verseRef, verseData, glossLanguage); + }); + + const verseDataArray = Object.values(verses); + const verseWithHash = verseDataArray.find((verseData) => verseData.hash); + const textVersion = verseWithHash?.hash || ''; + + const analyzedBook: AnalyzedBook = { + id: analyzedBookId, + bookRef: bookId, + textVersion, + segments, + }; + + const interlinearization: Interlinearization = { + id: interlinearizationId, + sourceWritingSystem: '', // Paratext 9 doesn't specify source writing system in InterlinearData + analysisLanguages: [glossLanguage], + books: [analyzedBook], + }; + + return interlinearization; +} diff --git a/src/parsers/interlinearXmlParser.ts b/src/parsers/paratext-9/paratext9Parser.ts similarity index 86% rename from src/parsers/interlinearXmlParser.ts rename to src/parsers/paratext-9/paratext9Parser.ts index 7102b92..ce9372e 100644 --- a/src/parsers/interlinearXmlParser.ts +++ b/src/parsers/paratext-9/paratext9Parser.ts @@ -6,7 +6,7 @@ import type { StringRange, InterlinearData, VerseData, -} from 'interlinearizer'; +} from 'paratext-9-types'; /** Range: Index and Length attributes. */ interface ParsedRange { @@ -62,10 +62,8 @@ interface ParsedVersesItem { VerseData?: ParsedVerseData; } -/** Root element: ScrTextName, GlossLanguage, BookId, Verses (with item[]). */ +/** Root element: GlossLanguage, BookId, Verses (with item[]). 
*/ interface ParsedInterlinearDataRoot { - /** Source text name (FXP attribute ScrTextName). */ - ['@_ScrTextName']?: string; /** Gloss language (FXP attribute GlossLanguage). */ ['@_GlossLanguage']?: string; /** Book id (FXP attribute BookId). */ @@ -95,7 +93,7 @@ function extractLexemesFromCluster(clusterElement: ParsedCluster): LexemeData[] if (!lexemeId) { throw new Error('Invalid XML: Lexeme missing required Id attribute'); } - return { LexemeId: lexemeId, SenseId: el['@_GlossId'] ?? '' }; + return { lexemeId, senseId: el['@_GlossId'] ?? '' }; }); } @@ -122,9 +120,9 @@ function extractPunctuationsFromVerse(verseDataElement: ParsedVerseData): Punctu if (!Number.isFinite(index) || !Number.isFinite(length)) return []; return [ { - TextRange: { Index: index, Length: length }, - BeforeText: el.BeforeText ?? '', - AfterText: el.AfterText ?? '', + textRange: { index, length }, + beforeText: el.BeforeText ?? '', + afterText: el.AfterText ?? '', }, ]; }); @@ -153,21 +151,21 @@ function extractClustersFromVerse(verseDataElement: ParsedVerseData): ClusterDat throw new Error('Invalid XML: Range missing required Index or Length attributes'); } - const textRange: StringRange = { Index: index, Length: length }; + const textRange: StringRange = { index, length }; const lexemes = extractLexemesFromCluster(el); // Join with "/"; lexeme IDs may contain "/", so do not split LexemesId elsewhere. - const lexemesId = lexemes.map((l) => l.LexemeId).join('/'); + const lexemesId = lexemes.map((l) => l.lexemeId).join('/'); /** Cluster Id: LexemesId/Index-Length when lexemes present; Index-Length when none. */ const id = lexemesId ? 
`${lexemesId}/${index}-${length}` : `${index}-${length}`; const excluded = el.Excluded === 'true'; return { - TextRange: textRange, - Lexemes: lexemes, - LexemesId: lexemesId, - Id: id, - Excluded: excluded, + textRange, + lexemes, + lexemesId, + id, + excluded, }; }); } @@ -179,7 +177,7 @@ function extractClustersFromVerse(verseDataElement: ParsedVerseData): ClusterDat * Output matches the types in `interlinearizer`; no extra conversion is done. Expects the * interlinear XML schema described in [pt9-xml.md](pt9-xml.md). */ -export class InterlinearXmlParser { +export class Paratext9Parser { private readonly parser: XMLParser; /** @@ -213,8 +211,8 @@ export class InterlinearXmlParser { * @param xml - Raw XML string (e.g. file contents). Must be valid interlinear XML with * InterlinearData root, GlossLanguage and BookId attributes, and Verses containing item * entries. - * @returns Parsed interlinear data: ScrTextName, GlossLanguage, BookId, and Verses (record of - * verse key to {@link VerseData} with Hash, Clusters, Punctuations). + * @returns Parsed interlinear data: GlossLanguage, BookId, and Verses (record of verse key to + * {@link VerseData} with Hash, Clusters, Punctuations). * @throws {Error} If the root element, required attributes (GlossLanguage, BookId), required * structure (Verses, Cluster Range, Lexeme Id), or duplicate verse reference is present. */ @@ -225,7 +223,6 @@ export class InterlinearXmlParser { throw new Error('Invalid XML: Missing InterlinearData root element'); } - const scrTextName = root['@_ScrTextName'] ?? ''; const glossLanguage = root['@_GlossLanguage'] ?? ''; const bookId = root['@_BookId'] ?? 
''; if (!glossLanguage || !bookId) { @@ -251,23 +248,22 @@ export class InterlinearXmlParser { const verseDataElement = item.VerseData; if (!verseDataElement) { - acc[verseKey] = { Hash: '', Clusters: [], Punctuations: [] }; + acc[verseKey] = { hash: '', clusters: [], punctuations: [] }; return acc; } acc[verseKey] = { - Hash: verseDataElement['@_Hash'] ?? '', - Clusters: extractClustersFromVerse(verseDataElement), - Punctuations: extractPunctuationsFromVerse(verseDataElement), + hash: verseDataElement['@_Hash'] ?? '', + clusters: extractClustersFromVerse(verseDataElement), + punctuations: extractPunctuationsFromVerse(verseDataElement), }; return acc; }, {}); return { - ScrTextName: scrTextName, - GlossLanguage: glossLanguage, - BookId: bookId, - Verses: verses, + glossLanguage, + bookId, + verses, }; } } diff --git a/src/parsers/pt9-xml.md b/src/parsers/paratext-9/pt9-xml.md similarity index 95% rename from src/parsers/pt9-xml.md rename to src/parsers/paratext-9/pt9-xml.md index 56d0baa..7cb7caf 100644 --- a/src/parsers/pt9-xml.md +++ b/src/parsers/paratext-9/pt9-xml.md @@ -8,7 +8,6 @@ The extension reads PT9 interlinear data from XML files (e.g. `Interlinear_ - + RUT 1:1 diff --git a/src/types/interlinearizer-enums.ts b/src/types/interlinearizer-enums.ts new file mode 100644 index 0000000..5ea8052 --- /dev/null +++ b/src/types/interlinearizer-enums.ts @@ -0,0 +1,58 @@ +/** + * @file Runtime enum values for the interlinearizer model. + * + * Type declarations (and these enums as types) live in interlinearizer.d.ts for the declared module + * 'interlinearizer'. This file provides the actual enum values so code that imports from this + * path (e.g. parsers/converter) has runtime access. Keeps a single source of truth for enum + * values and avoids duplicating them in test mocks. + */ + +/** Whether an occurrence position holds a word or punctuation. */ +export enum OccurrenceType { + /** A word occurrence. */ + Word = 'word', + /** A punctuation occurrence. 
*/ + Punctuation = 'punctuation', +} + +/** The kind of linguistic analysis represented. */ +export enum AnalysisType { + /** Surface wordform only — no gloss or morpheme breakdown. */ + Wordform = 'wordform', + /** Morpheme-level analysis with MorphemeBundles. */ + Morph = 'morph', + /** Word-level gloss (no morpheme decomposition). */ + Gloss = 'gloss', + /** Punctuation placeholder. */ + Punctuation = 'punctuation', +} + +/** + * How the analysis was produced. + * + * - `high` + * - `medium` + * - `low` + * - `guess` + */ +export enum Confidence { + Guess = 'guess', + Low = 'low', + Medium = 'medium', + High = 'high', +} + +/** + * Lifecycle status of an assignment or alignment link. + * + * - `approved` — human-confirmed. + * - `suggested` — machine-generated or unreviewed. + * - `candidate` — proposed but not yet reviewed. + * - `rejected` — explicitly rejected by a human. + */ +export enum AssignmentStatus { + Approved = 'approved', + Suggested = 'suggested', + Candidate = 'candidate', + Rejected = 'rejected', +} diff --git a/src/types/interlinearizer.d.ts b/src/types/interlinearizer.d.ts index 75736ff..2bcd6f7 100644 --- a/src/types/interlinearizer.d.ts +++ b/src/types/interlinearizer.d.ts @@ -2,74 +2,483 @@ * @file Extension type declaration file. Platform.Bible shares this with other extensions. Types * exposed here (and in papi-shared-types) are available to other extensions. */ + /** - * Interlinear types (InterlinearData, VerseData, ClusterData, etc.) are the public API for - * interlinear data. The XML parser in src/parsers/interlinearXmlParser.ts consumes raw - * fast-xml-parser output internally and returns objects conforming to these types. + * Interlinearizer Interlinear Model + * + * A representation for interlinear data that should cover import from LCM (FieldWorks), Paratext 9, + * and BT Extension and support the new interlinearizer */ declare module 'interlinearizer' { - /** Character range in source text (Index, Length). 
*/ - export interface StringRange { - /** Start index of the range in the source text (0-based). */ - Index: number; - /** Number of characters in the range. */ - Length: number; + // --------------------------------------------------------------------------- + // Enums + // --------------------------------------------------------------------------- + + /** Whether an occurrence position holds a word or punctuation. */ + export enum OccurrenceType { + /** A word occurrence. */ + Word = 'word', + /** A punctuation occurrence. */ + Punctuation = 'punctuation', + } + + /** The kind of linguistic analysis represented. */ + export enum AnalysisType { + /** Surface wordform only — no gloss or morpheme breakdown. */ + Wordform = 'wordform', + /** Morpheme-level analysis with MorphemeBundles. */ + Morph = 'morph', + /** Word-level gloss (no morpheme decomposition). */ + Gloss = 'gloss', + /** Punctuation placeholder. */ + Punctuation = 'punctuation', + } + + /** + * How the analysis was produced. + * + * - `high` + * - `medium` + * - `low` + * - `guess` + */ + export enum Confidence { + Guess = 'guess', + Low = 'low', + Medium = 'medium', + High = 'high', } - /** Data on the interlinearization of a single lexeme. */ - export interface LexemeData { - /** ID of the lexeme (e.g. from Lexicon; XML attribute Id). */ - LexemeId: string; - /** ID of the sense/gloss used for this lexeme (XML attribute GlossId). */ - SenseId: string; + /** + * Lifecycle status of an assignment or alignment link. + * + * - `approved` — human-confirmed. + * - `suggested` — machine-generated or unreviewed. + * - `candidate` — proposed but not yet reviewed. + * - `rejected` — explicitly rejected by a human. + */ + export enum AssignmentStatus { + Approved = 'approved', + Suggested = 'suggested', + Candidate = 'candidate', + Rejected = 'rejected', } - /** Data on the interlinearization of a cluster. */ - export interface ClusterData { - /** Character range this cluster occupies in the verse text. 
*/ - TextRange: StringRange; - /** Lexemes in this cluster, in order. */ - Lexemes: LexemeData[]; - /** Slash-joined LexemeIds for this cluster (e.g. "Word:a/Word:b"). */ - LexemesId: string; - /** Unique cluster id: LexemesId plus TextRange (e.g. "Word:a/Word:b/21-3"). */ - Id: string; - /** Excluded flag. See [pt9-xml.md](../parsers/pt9-xml.md) for details. */ - Excluded: boolean; + // --------------------------------------------------------------------------- + // §1.1 Interlinearization + // --------------------------------------------------------------------------- + + /** + * Top-level container for all interlinear data. + * + * Source-system mapping: + * + * - LCM: one `IScripture` instance (singleton per project). + * - Paratext: merged from per-book, per-language `InterlinearData` files. + * - BT Extension: one `Translation` (project scope). + */ + export interface Interlinearization { + id: string; + + /** Writing system of the source text being analyzed. */ + sourceWritingSystem: string; + + /** + * Writing systems in which analyses are provided (e.g. `["en", "fr"]`). A single interlinear + * can hold analyses in multiple languages. + */ + analysisLanguages: string[]; + + /** Books of scripture (or other texts) that have been analyzed. */ + books: AnalyzedBook[]; } - /** Data on punctuation change. */ - export interface PunctuationData { - /** Character range this punctuation occupies in the verse text. */ - TextRange: StringRange; - /** Punctuation text before the change (or empty). */ - BeforeText: string; - /** Punctuation text after the change (or empty). */ - AfterText: string; + // --------------------------------------------------------------------------- + // §1.2 AnalyzedBook + // --------------------------------------------------------------------------- + + /** + * One book of scripture (or other text unit) analyzed within an Interlinear. + * + * Source-system mapping: + * + * - LCM: `IScrBook`. `bookRef` = `BookId` (3-letter SIL code). 
+ * - Paratext: book-level `InterlinearData` (merged across languages). + * - BT Extension: one book within a `Translation`. + */ + export interface AnalyzedBook { + id: string; + + /** Book identifier (e.g. `"GEN"`, `"MAT"`). */ + bookRef: string; + + /** + * Hash or version stamp of the source text at analysis time. Used to detect when the underlying + * text has changed and analyses may be stale. + */ + textVersion: string; + + /** Ordered segments that compose this book. */ + segments: Segment[]; + } + + // --------------------------------------------------------------------------- + // §1.3 Segment + // --------------------------------------------------------------------------- + + /** + * A sentence, clause, or verse — the unit within which occurrences are ordered. + * + * Source-system mapping: + * + * - LCM: `ISegment` owned by `IScrTxtPara` within `IScrSection`. + * - Paratext: a verse (`VerseRef`) within `VerseData`. + * - BT Extension: a `Verse` (BCV identifier). + */ + export interface Segment { + id: string; + + /** Canonical reference (e.g. verse reference, paragraph index + offset range). */ + segmentRef: string; + + /** Raw text of the segment, for display and validation. */ + baselineText?: string; + + /** Idiomatic translation of the segment. */ + freeTranslation?: MultiString; + + /** Word-for-word translation. */ + literalTranslation?: MultiString; + + /** Ordered word / punctuation tokens in this segment. */ + occurrences: Occurrence[]; } - /** Interlinear data for a single verse. */ - export interface VerseData { - /** Hash of verse text when approved; empty string if not approved. */ - Hash: string; - /** Lexeme clusters in this verse. */ - Clusters: ClusterData[]; - /** Punctuation changes in this verse. */ - Punctuations: PunctuationData[]; + /** A string value keyed by writing-system tag. 
 */
+  export type MultiString = Record<string, string>;
+
+  // ---------------------------------------------------------------------------
+  // §1.4 Occurrence
+  // ---------------------------------------------------------------------------
+
+  /**
+   * A single word or punctuation token at a specific position in the text. Inherits its text
+   * version from the parent AnalyzedBook.
+   *
+   * Source-system mapping:
+   *
+   * - LCM: entry in `ISegment.AnalysesRS` at a given index.
+   * - Paratext: `ClusterData` within `VerseData`.
+   * - BT Extension: `Token` (API) / `Instance` (DB).
+   */
+  export interface Occurrence {
+    id: string;
+
+    /** Parent segment. */
+    segmentId: string;
+
+    /** Zero-based position within the segment (preserves word order). */
+    index: number;
+
+    /**
+     * Positional anchor in the source text. Supports BCVWP, BCVWP+partNum, StringRange, or
+     * character offset depending on source system.
+     */
+    anchor: string;
+
+    /** The text as it appears in the source. */
+    surfaceText: string;
+
+    /** Writing system of `surfaceText`. */
+    writingSystem: string;
+
+    type: OccurrenceType;
+
+    /** All analysis assignments for this occurrence (zero or more). */
+    assignments: AnalysisAssignment[];
   }

-  /** Root interlinear data: book + verses. */
-  export interface InterlinearData {
-    /** Source text / project name (e.g. from InterlinearData ScrTextName attribute). */
-    ScrTextName: string;
-    /** Language code or name for the glosses. */
-    GlossLanguage: string;
-    /** Book id (e.g. "RUT", "MAT"). */
-    BookId: string;
+  // ---------------------------------------------------------------------------
+  // §1.5 Analysis
+  // ---------------------------------------------------------------------------
+
+  /**
+   * A reusable analysis describing a linguistic interpretation of a word. The same analysis can be
+   * assigned to many occurrences.
+   *
+   * Confidence and provenance belong to the analysis itself because they describe how the
+   * interpretation was produced.
+ * + * Source-system mapping: + * + * - LCM: `IWfiAnalysis` (morph), `IWfiGloss` (gloss), or bare `IWfiWordform` (wordform). + * - Paratext: `LexemeCluster` + `WordAnalysis`. + * - BT Extension: synthesized from `Token.gloss` / `lemmaText` / `senseIds`. Requires deduplication + * — BT Extension stores gloss/sense per-token, not as shared analysis objects. + */ + export interface Analysis { + id: string; + + /** Writing system of the analysis (e.g. the gloss language). */ + analysisLanguage: string; + + analysisType: AnalysisType; + + confidence: Confidence; + + /** System that produced the analysis (e.g. "lcm", "paratext"). */ + sourceSystem: string; + + /** + * User or automation identifier within the source system (e.g. "jsmith", "parser-v3", + * "auto-glosser"). Use a stable automation ID when no human directly applied the analysis. + */ + sourceUser: string; + + /** Word-level gloss text. */ + glossText?: string; + + /** Part of speech. */ + pos?: string; + + /** Morphosyntactic feature structure. */ + features?: Record; + + /** Ordered morpheme breakdown, when analysis is at the morpheme level (`analysisType = morph`). */ + morphemeBundles?: MorphemeBundle[]; + } + + // --------------------------------------------------------------------------- + // §1.6 AnalysisAssignment + // --------------------------------------------------------------------------- + + /** + * The join between an occurrence and an analysis. Multiple assignments per occurrence enable + * competing analyses. + * + * Source-system mapping: + * + * - LCM: `ISegment.AnalysesRS[i]` referencing `IWfiGloss` or `IWfiAnalysis`. + * - Paratext: `ClusterData` with selected `LexemeData`. + * - BT Extension: `Token` linked to senses (`senseIds`). Status inferred from + * `Instance.termStatusNum` (BiblicalTermStatus enum). + */ + export interface AnalysisAssignment { + id: string; + + /** The occurrence being analyzed. */ + occurrenceId: string; + + /** The analysis applied. 
*/ + analysisId: string; + + /** Whether a human has confirmed this analysis for this occurrence. */ + status: AssignmentStatus; + + /** Timestamp of when the assignment was made. */ + createdAt?: string; + } + + // --------------------------------------------------------------------------- + // §1.7 MorphemeBundle + // --------------------------------------------------------------------------- + + /** + * An ordered morpheme within a morpheme-level analysis, linking to the lexicon. + * + * The four optional lexicon references mirror LCM's `IWfiMorphBundle` three-way link plus the + * owning entry: + * + * `allomorphRef` → `IMoForm` (which surface form / allomorph) `lexemeRef` → `ILexEntry` (owning + * dictionary entry) `senseRef` → `ILexSense` (which meaning) `grammarRef` → `IMoMorphSynAnalysis` + * (grammatical behaviour) + * + * In LCM an `ILexEntry` owns one _LexemeForm_ (the elsewhere / citation allomorph) and + * zero-or-more _AlternateForms_ — both are `IMoForm`. `allomorphRef` identifies the specific + * `IMoForm` matched in this context; `lexemeRef` identifies the entry that owns it. + * + * `form` vs `allomorphRef` — `form` is the surface text of the morpheme as it appeared in this + * specific analysis context. `allomorphRef` is a reference (ID) to the canonical allomorph object + * in the lexicon. These can legitimately differ: in LCM `IWfiMorphBundle.Form` may reflect + * phonological conditioning that differs from the canonical `IMoForm.Form`. When `allomorphRef` + * is absent, `form` is the only record of the morpheme shape. + * + * Source-system mapping: + * + * - LCM: `IWfiMorphBundle` (1:1). `allomorphRef` = GUID of `IWfiMorphBundle.MorphRA` (`IMoForm`). + * `lexemeRef` = GUID of the `ILexEntry` that owns that `IMoForm` (via `LexemeFormOA` or + * `AlternateFormsOS`). + * - Paratext: each `Lexeme` within a `WordAnalysis`. 
Paratext's built-in XML lexicon has no + * allomorph concept distinct from the entry — `Lexeme.AlternateForms` exists in the interface + * but returns empty. `allomorphRef` is therefore omitted for the built-in lexicon. When an + * integrated provider (e.g. FLEx via `IntegratedLexicalProvider`) is active, `AllomorphEntry` + * surfaces actual allomorphs and `allomorphRef` can be populated. `lexemeRef` = `Lexeme.Id` + * (LexemeKey-derived). + * - BT Extension: not natively modeled as morpheme bundles. A whole-word bundle can be synthesized: + * `form` = `Token.text`, `allomorphRef` = `headwordId` (the BT Extension "morph" concept + * corresponds to the FieldWorks Allomorph; the HeadWord's lemma is the elsewhere / LexemeForm + * allomorph), `lexemeRef` = `headwordId`, `senseRef` = `senseIds[0]`. Macula TSV `morph` field + * can supply the specific allomorphic form when it differs from the lemma. + */ + export interface MorphemeBundle { + id: string; + + /** Zero-based position within the analysis (preserves morpheme order). */ + index: number; + + /** The morpheme form as it appears in this analysis (surface text). */ + form: string; + + /** Writing system of `form`. */ + writingSystem: string; + + /** + * Reference to a specific Allomorph (`IMoForm`) in the lexical model. + * + * An `ILexEntry` in LCM owns one _LexemeForm_ (the elsewhere / citation allomorph) and + * zero-or-more _AlternateForms_. This field identifies which allomorph was matched in this + * morpheme position. + * + * In the BT Extension the "morph" concept aligns with this field: the HeadWord's lemma acts as + * the LexemeForm (elsewhere allomorph). + */ + allomorphRef?: string; + + /** Reference to Lexeme (`ILexEntry`) in the lexical model. */ + lexemeRef?: string; + + /** Reference to Sense (`ILexSense`) in the lexical model. */ + senseRef?: string; + + /** Reference to Grammar / MSA (`IMoMorphSynAnalysis`) in the lexical model. 
*/ + grammarRef?: string; + } + + // --------------------------------------------------------------------------- + // §1.8 InterlinearAlignment + // --------------------------------------------------------------------------- + + /** + * A project pairing a source-language interlinearization and a target-language interlinear with + * morph-level alignment links between them. + * + * Both interlinearizations carry their own analyzed books, segments, occurrences, and analyses. + * AlignmentLinks bridge the two, connecting individual morphemes (MorphemeBundles) or whole + * unanalyzed words (Occurrences) across the language boundary. + * + * Source-system mapping: + * + * - LCM: LCM has no native alignment or bilingual pairing model. An InterlinearAlignment is + * constructed by pairing a Scripture- based interlinearization (vernacular) with a source-text + * interlinearization produced externally (e.g. Greek/Hebrew resource text). + * - Paratext: not directly represented. Can be constructed from parallel projects that share the + * same versification. + * - BT Extension: one `Translation` scoped to source + target sides (`Translation.sideNum`: 1 = + * source, 2 = target). Each side becomes an `Interlinearization`. `Alignment` records become + * `AlignmentLink`s. + */ + export interface InterlinearAlignment { + id: string; + + /** The source-language interlinearization (e.g. Greek / Hebrew). */ + source: Interlinearization; + + /** The target-language interlinearization (e.g. vernacular translation). */ + target: Interlinearization; + + /** + * Morph-level alignment links connecting endpoints in the source interlinear to endpoints in + * the target interlinear. 
+ */ + links: AlignmentLink[]; + } + + // --------------------------------------------------------------------------- + // §1.9 AlignmentLink + // --------------------------------------------------------------------------- + + /** + * A directional alignment link from one or more source-text morphemes / words to one or more + * target-text morphemes / words. + * + * Each endpoint resolves to either: + * + * - A specific MorphemeBundle within a fully analyzed occurrence, connecting at the allomorph level + * (via `allomorphRef`). + * - A whole unanalyzed occurrence, when no morpheme-level analysis exists. + * + * Typical workflow: the user selects a morph from the source-text interlinear and connects it to + * an allomorph of a fully analyzed occurrence in the target-text interlinear — or to an + * unanalyzed occurrence if the target word has not yet been broken into morphemes. + * + * Source-system mapping: + * + * - LCM: no native alignment model; links are produced by external tools. + * - Paratext: not stored in interlinear data; derivable from parallel interlinear selections when + * two projects share versification. + * - BT Extension: `Alignment` entity. Each `Alignment` record with `sourceInstances` / + * `targetInstances` is decomposed into `AlignmentEndpoint`s — one per instance. BT Extension's + * "morph" concept (the token's morphological form) maps to a MorphemeBundle-level endpoint when + * a morpheme analysis is present; otherwise the endpoint targets the whole occurrence. `status` + * from `statusNum` via BT Extension's `AlignmentStatus` enum (CREATED=0, REJECTED=1, + * APPROVED=2, NEEDS_REVIEW=3) — lossy mapping where both CREATED and NEEDS_REVIEW collapse to + * `candidate`. `origin` from `originNum` — an undocumented integer with no enum; descriptive + * strings must be defined externally. Eflomal-generated alignments leave `originNum` and + * `statusNum` unset, so both default to 0 (`CREATED`). 
+ */ + export interface AlignmentLink { + id: string; + + /** Source-side endpoints (one or more morphemes / words from the source interlinear). */ + sourceEndpoints: AlignmentEndpoint[]; + + /** Target-side endpoints (one or more morphemes / words from the target interlinear). */ + targetEndpoints: AlignmentEndpoint[]; + + status: AssignmentStatus; + + /** How the alignment was created (manual, automatic tool, etc.). */ + origin?: string; + + /** + * Confidence in this alignment link, independent of the confidence on the analyses at each + * endpoint. + */ + confidence?: Confidence; + + /** Multilingual notes keyed by writing system (e.g. UI locale). */ + notes?: MultiString; + } + + // --------------------------------------------------------------------------- + // §1.10 AlignmentEndpoint + // --------------------------------------------------------------------------- + + /** + * One side of an alignment link, identifying a precise point of connection within an interlinear + * text. + * + * When the referenced occurrence has a morpheme-level analysis, `bundleId` identifies the + * specific MorphemeBundle — and by extension its `allomorphRef` (IMoForm), `lexemeRef` + * (ILexEntry), `senseRef` (ILexSense), and `grammarRef` (IMoMorphSynAnalysis). + * + * When the occurrence is unanalyzed, `bundleId` is absent and the link targets the whole word. + * + * Resolution chain (fully analyzed): AlignmentEndpoint → Occurrence → AnalysisAssignment → + * Analysis → MorphemeBundle → allomorphRef (IMoForm) → lexemeRef (ILexEntry) → senseRef + * (ILexSense) → grammarRef (IMoMorphSynAnalysis) + * + * Resolution chain (unanalyzed): AlignmentEndpoint → Occurrence → surfaceText only + */ + export interface AlignmentEndpoint { + /** The word or punctuation occurrence in the text. */ + occurrenceId: string; + /** - * Verse data keyed by verse reference (e.g. "RUT 3:1"). Exactly one entry per reference; the - * parser rejects XML that contains duplicate verse references. 
+ * Identifies a specific MorphemeBundle within one of the occurrence's analyses. When set, the + * alignment connects at the allomorph / morpheme level. When absent, the alignment connects to + * the whole (unanalyzed) occurrence. */ - Verses: Record; + bundleId?: string; } } diff --git a/tsconfig.json b/tsconfig.json index 6a9ab66..53a54d9 100644 --- a/tsconfig.json +++ b/tsconfig.json @@ -57,10 +57,11 @@ "sourceMap": true, // We need a baseurl for webpack's tsconfig path aliases plugin "baseUrl": "./", - /** Paths for src-rooted imports (e.g. in src/__tests__ use "parsers/..." or "main" instead of "../../parsers/..."). */ + /** Paths for src-rooted imports (e.g. in src/__tests__ use "parsers/..." or "types/..." instead of relative paths). */ "paths": { "@main": ["src/main"], - "parsers/*": ["src/parsers/*"] + "parsers/*": ["src/parsers/*"], + "types/*": ["src/types/*"] }, "noUnusedLocals": true, "noUnusedParameters": true, From 00e321b28329d96d351e2ef2ce0b6853f2808c85 Mon Sep 17 00:00:00 2001 From: alex-rawlings-yyc Date: Thu, 19 Feb 2026 15:11:01 -0700 Subject: [PATCH 2/8] Enhance interlinearizer WebView with analyses view and update tests - Add support for a new JSON view mode displaying analyses derived from parsed data. - Implement functions to describe and label the new view mode. - Update the WebView component to include a button for switching to the analyses view. - Modify tests to cover the new analyses functionality and ensure proper rendering. - Refactor the `createAnalyses` function to generate analysis maps from interlinear data. 
--- .../interlinearizer.web-view.test.tsx | 35 ++- .../paratext-9/paratext9Converter.test.ts | 218 +++++++++++++++++- src/interlinearizer.web-view.tsx | 68 ++++-- src/parsers/paratext-9/paratext-9-types.ts | 2 +- src/parsers/paratext-9/paratext9Converter.ts | 8 +- 5 files changed, 302 insertions(+), 29 deletions(-) diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index 67cc843..7b25c59 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -25,6 +25,23 @@ const stubInterlinearization = { const mockParse = jest.fn().mockReturnValue(stubInterlinearData); const mockConvert = jest.fn().mockReturnValue(stubInterlinearization); +/** Stub analyses map for Analyses view (ID → Analysis). */ +const stubAnalysesMap = new Map([ + [ + 'analysis-en-lex1-s1', + { + id: 'analysis-en-lex1-s1', + analysisLanguage: 'en', + analysisType: 'gloss', + confidence: 'medium', + sourceSystem: 'paratext-9', + sourceUser: 'paratext-9-parser', + glossText: 'sense1', + }, + ], +]); +const mockCreateAnalyses = jest.fn().mockReturnValue(stubAnalysesMap); + /** Mock parser: no real XML parsing; returns stub data. Parser/converter are tested elsewhere. */ jest.mock('parsers/paratext-9/paratext9Parser', () => ({ Paratext9Parser: jest.fn().mockImplementation(() => ({ @@ -32,9 +49,10 @@ jest.mock('parsers/paratext-9/paratext9Parser', () => ({ })), })); -/** Mock converter: no real conversion; returns stub Interlinearization. */ +/** Mock converter: no real conversion; returns stub Interlinearization and stub analyses map. 
*/ jest.mock('parsers/paratext-9/paratext9Converter', () => ({ convertParatext9ToInterlinearization: mockConvert, + createAnalyses: mockCreateAnalyses, })); /** @@ -86,13 +104,14 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/test-data\/Interlinear_en_MAT\.xml/i)).toBeInTheDocument(); }); - it('renders the JSON view mode switch (InterlinearData / Interlinearization)', () => { + it('renders the JSON view mode switch (InterlinearData / Interlinearization / Analyses)', () => { render(); const group = screen.getByRole('group', { name: /json view mode/i }); expect(group).toBeInTheDocument(); expect(screen.getByRole('button', { name: /^interlineardata$/i })).toBeInTheDocument(); expect(screen.getByRole('button', { name: /^interlinearization$/i })).toBeInTheDocument(); + expect(screen.getByRole('button', { name: /^analyses$/i })).toBeInTheDocument(); expect(screen.getByText(/view json as:/i)).toBeInTheDocument(); }); @@ -152,6 +171,18 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/bookId/i)).toBeInTheDocument(); }); + it('switching to Analyses shows analysis map JSON from test data', () => { + render(); + + fireEvent.click(screen.getByRole('button', { name: /^analyses$/i })); + + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + expect(mockCreateAnalyses).toHaveBeenCalledWith(stubInterlinearData); + expect(screen.getByText(/analysis-en-lex1-s1/)).toBeInTheDocument(); + expect(screen.getByText(/glossText/i)).toBeInTheDocument(); + expect(screen.getByText(/paratext-9/i)).toBeInTheDocument(); + }); + it('renders empty JSON pre when jsonToShow is undefined (converter returns undefined)', () => { mockConvert.mockReturnValueOnce(undefined); diff --git a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts index 7a86cdf..f8a2600 100644 --- a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts +++ 
b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts @@ -1,8 +1,11 @@ -/** @file Unit tests for {@link convertParatext9ToInterlinearization}. */ +/** @file Unit tests for {@link convertParatext9ToInterlinearization} and {@link createAnalyses}. */ /// import type { InterlinearData } from 'paratext-9-types'; -import { convertParatext9ToInterlinearization } from 'parsers/paratext-9/paratext9Converter'; +import { + convertParatext9ToInterlinearization, + createAnalyses, +} from 'parsers/paratext-9/paratext9Converter'; describe('convertParatext9ToInterlinearization', () => { describe('top-level structure', () => { @@ -428,4 +431,215 @@ describe('convertParatext9ToInterlinearization', () => { expect(result.books[0].segments[0].occurrences[0].id).toBe(`${segId}-occ-0-Word:word/0-4`); }); }); + + describe('createAnalyses', () => { + it('returns empty Map when verses is empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: {}, + }; + const result = createAnalyses(data); + + expect(result).toBeInstanceOf(Map); + expect(result.size).toBe(0); + }); + + it('returns one Analysis for one verse with one cluster and one lexeme', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [{ lexemeId: 'Word:hello', senseId: 'g1' }], + lexemesId: 'Word:hello', + id: 'Word:hello/0-4', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(1); + const analysis = result.get('analysis-en-Word:hello-g1'); + expect(analysis).toBeDefined(); + expect(analysis?.id).toBe('analysis-en-Word:hello-g1'); + expect(analysis?.analysisLanguage).toBe('en'); + expect(analysis?.analysisType).toBe('gloss'); + expect(analysis?.confidence).toBe('medium'); + expect(analysis?.sourceSystem).toBe('paratext-9'); + 
expect(analysis?.sourceUser).toBe('paratext-9-parser'); + expect(analysis?.glossText).toBe('g1'); + }); + + it('deduplicates: same lexeme in multiple clusters yields one analysis', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 3 }, + lexemes: [{ lexemeId: 'Word:the', senseId: 'def' }], + lexemesId: 'Word:the', + id: 'c1', + excluded: false, + }, + { + textRange: { index: 4, length: 3 }, + lexemes: [{ lexemeId: 'Word:the', senseId: 'def' }], + lexemesId: 'Word:the', + id: 'c2', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(1); + expect(result.has('analysis-en-Word:the-def')).toBe(true); + }); + + it('returns multiple analyses for different lexemes (lexemeId or senseId)', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 4 }, + lexemes: [ + { lexemeId: 'Stem:run', senseId: 'g1' }, + { lexemeId: 'Suffix:ing', senseId: 'g2' }, + ], + lexemesId: 'Stem:run', + id: 'cluster1', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(2); + expect(result.has('analysis-en-Stem:run-g1')).toBe(true); + expect(result.has('analysis-en-Suffix:ing-g2')).toBe(true); + expect(result.get('analysis-en-Stem:run-g1')?.glossText).toBe('g1'); + expect(result.get('analysis-en-Suffix:ing-g2')?.glossText).toBe('g2'); + }); + + it('sets glossText to undefined when senseId is empty', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 1 }, + lexemes: [{ lexemeId: 'Word:a', senseId: '' }], + lexemesId: 'Word:a', + id: 'Word:a/0-1', + excluded: false, + }, + ], + punctuations: 
[], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(1); + const analysis = result.get('analysis-en-Word:a'); + expect(analysis).toBeDefined(); + expect(analysis?.glossText).toBeUndefined(); + expect(analysis?.id).toBe('analysis-en-Word:a'); + }); + + it('uses glossLanguage from interlinearData for analysisLanguage and id prefix', () => { + const data: InterlinearData = { + glossLanguage: 'fr', + bookId: 'GEN', + verses: { + 'GEN 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 2 }, + lexemes: [{ lexemeId: 'Word:au', senseId: 'sens1' }], + lexemesId: 'Word:au', + id: 'c1', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(1); + const analysis = result.get('analysis-fr-Word:au-sens1'); + expect(analysis).toBeDefined(); + expect(analysis?.analysisLanguage).toBe('fr'); + expect(analysis?.id).toBe('analysis-fr-Word:au-sens1'); + }); + + it('includes analyses from all verses', () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 3 }, + lexemes: [{ lexemeId: 'Word:one', senseId: 's1' }], + lexemesId: 'Word:one', + id: 'c1', + excluded: false, + }, + ], + punctuations: [], + }, + 'MAT 1:2': { + hash: '', + clusters: [ + { + textRange: { index: 0, length: 3 }, + lexemes: [{ lexemeId: 'Word:two', senseId: 's2' }], + lexemesId: 'Word:two', + id: 'c2', + excluded: false, + }, + ], + punctuations: [], + }, + }, + }; + const result = createAnalyses(data); + + expect(result.size).toBe(2); + expect(result.has('analysis-en-Word:one-s1')).toBe(true); + expect(result.has('analysis-en-Word:two-s2')).toBe(true); + }); + }); }); diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index 4d1a14d..b3808ba 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -1,7 +1,10 @@ 
import { useMemo, useState } from 'react'; import type { InterlinearData } from 'paratext-9-types'; -import { Paratext9Parser } from './parsers/paratext-9/paratext9Parser'; -import { convertParatext9ToInterlinearization } from './parsers/paratext-9/paratext9Converter'; +import { Paratext9Parser } from 'parsers/paratext-9/paratext9Parser'; +import { + convertParatext9ToInterlinearization, + createAnalyses, +} from 'parsers/paratext-9/paratext9Converter'; /** Test interlinear XML bundled at build time (from test-data/Interlinear_en_MAT.xml). */ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; @@ -9,16 +12,30 @@ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; /** Result of parsing the bundled test XML: either data or an error message. */ type ParseResult = { data: InterlinearData; error: undefined } | { data: undefined; error: string }; -/** View mode for the JSON display: raw PT9 structure or converted interlinearizer model. */ -type JsonViewMode = 'interlinear-data' | 'interlinearization'; +/** View mode for the JSON display: raw PT9, converted model, or analyses map. */ +type JsonViewMode = 'interlinear-data' | 'interlinearization' | 'analyses'; + +function getViewModeDescription(mode: JsonViewMode): string { + if (mode === 'interlinear-data') return 'Paratext 9 book/verse/cluster structure.'; + if (mode === 'interlinearization') + return 'Converted interlinearizer book/segment/occurrence model.'; + return 'Analysis objects (ID → gloss, confidence, source) from test data.'; +} + +function getViewModeLabel(mode: JsonViewMode): string { + if (mode === 'interlinear-data') return 'InterlinearData (JSON):'; + if (mode === 'interlinearization') return 'Interlinearization (JSON):'; + return 'Analyses (JSON):'; +} /** * Main interlinearizer WebView. Parses the bundled test XML into the interlinear model and displays * the result as raw JSON. No PAPI commands or file loading—everything is self-contained. 
* - * A switch lets the user choose between viewing {@link InterlinearData} (Paratext 9 format) or - * {@link Interlinearization} (converted interlinearizer model). Parser is created inside useMemo so - * parsing runs once per mount. + * A switch lets the user choose between: {@link InterlinearData} (Paratext 9 format), + * {@link Interlinearization} (converted interlinearizer model), or Analyses (ID → Analysis map + * derived from test data: gloss, confidence, source). Parser is created inside useMemo so parsing + * runs once per mount. */ globalThis.webViewComponent = function InterlinearizerWebView() { const [jsonViewMode, setJsonViewMode] = useState('interlinear-data'); @@ -38,8 +55,19 @@ globalThis.webViewComponent = function InterlinearizerWebView() { [parsed], ); - /** In Interlinearization mode use converted data (may be undefined); otherwise use parsed. */ - const jsonToShow = jsonViewMode === 'interlinearization' ? interlinearization : parsed; + /** Analyses map derived from parsed data (ID → Analysis); only defined when parsed exists. */ + const analysesMap = useMemo(() => (parsed ? createAnalyses(parsed) : undefined), [parsed]); + + /** Data to show as JSON: depends on selected view mode. */ + const jsonToShow = ((): + | typeof parsed + | ReturnType + | Record + | undefined => { + if (jsonViewMode === 'interlinearization') return interlinearization; + if (jsonViewMode === 'analyses' && analysesMap) return Object.fromEntries(analysesMap); + return parsed; + })(); return (
@@ -90,18 +118,24 @@ globalThis.webViewComponent = function InterlinearizerWebView() { > Interlinearization +

- {jsonViewMode === 'interlinear-data' - ? 'Paratext 9 book/verse/cluster structure.' - : 'Converted interlinearizer book/segment/occurrence model.'} + {getViewModeDescription(jsonViewMode)}

-

- {jsonViewMode === 'interlinear-data' - ? 'InterlinearData (JSON):' - : 'Interlinearization (JSON):'} -

+

{getViewModeLabel(jsonViewMode)}

             {jsonToShow ? JSON.stringify(jsonToShow, undefined, 2) : ''}
           
diff --git a/src/parsers/paratext-9/paratext-9-types.ts b/src/parsers/paratext-9/paratext-9-types.ts index 263bbd7..9aa1c3c 100644 --- a/src/parsers/paratext-9/paratext-9-types.ts +++ b/src/parsers/paratext-9/paratext-9-types.ts @@ -25,7 +25,7 @@ declare module 'paratext-9-types' { lexemesId: string; /** Unique cluster id: LexemesId plus TextRange (e.g. "Word:a/Word:b/21-3"). */ id: string; - /** Excluded flag. See [pt9-xml.md](../parsers/pt9-xml.md) for details. */ + /** Excluded flag. See [pt9-xml.md](pt9-xml.md) for details. */ excluded: boolean; } diff --git a/src/parsers/paratext-9/paratext9Converter.ts b/src/parsers/paratext-9/paratext9Converter.ts index ea8d010..19fd2dc 100644 --- a/src/parsers/paratext-9/paratext9Converter.ts +++ b/src/parsers/paratext-9/paratext9Converter.ts @@ -45,7 +45,6 @@ function generateBookId(bookId: string): string { /** * Generates a deterministic ID for a segment (verse). * - * @param bookId - Book ID. * @param verseRef - Verse reference (e.g., "MAT 1:1"). * @returns A unique ID for the segment. */ @@ -124,7 +123,6 @@ function textRangeToAnchor(textRange: StringRange): string { * * @param verseRef - Verse reference (e.g., "MAT 1:1"). * @param verseData - Verse data from Paratext 9. - * @param bookId - Book ID for generating segment ID. * @param glossLanguage - Gloss language code. * @returns A Segment with occurrences converted from clusters and punctuations. */ @@ -198,11 +196,10 @@ function convertVerseToSegment( * @param interlinearData - Paratext 9 interlinear data. * @returns Map of analysis ID to Analysis object. 
 */
-function createAnalyses(interlinearData: InterlinearData): Map<string, Analysis> {
+export function createAnalyses(interlinearData: InterlinearData): Map<string, Analysis> {
   const analyses = new Map<string, Analysis>();
   const { glossLanguage } = interlinearData;

-  // Collect all unique lexeme-sense pairs
   Object.values(interlinearData.verses).forEach((verseData) => {
     verseData.clusters.forEach((cluster) => {
       cluster.lexemes.forEach((lexeme) => {
@@ -257,9 +254,6 @@ export function convertParatext9ToInterlinearization(
   const interlinearizationId = generateInterlinearizationId(bookId);
   const analyzedBookId = generateBookId(bookId);

-  // Note: analyses are created but not returned - they're referenced via analysisId in assignments
-  createAnalyses(interlinearData);
-
   const segments = Object.entries(verses).map(([verseRef, verseData]) => {
     return convertVerseToSegment(verseRef, verseData, glossLanguage);
   });

From 005eb2ee5ed828e1ea1b5409d617df542bf04652 Mon Sep 17 00:00:00 2001
From: alex-rawlings-yyc
Date: Thu, 19 Feb 2026 15:23:54 -0700
Subject: [PATCH 3/8] Refactor interlinearizer WebView for accessibility and
 update tests

- Change role from 'group' to 'radiogroup' for JSON view mode buttons to improve accessibility.
- Update button roles to 'radio' and aria attributes to 'aria-checked' for better semantic meaning.
- Modify tests to reflect the updated roles and ensure proper functionality of the JSON view mode switch.
--- .../interlinearizer.web-view.test.tsx | 20 +++++++++---------- .../paratext-9/paratext9Converter.test.ts | 1 + src/interlinearizer.web-view.tsx | 11 ++++++---- src/parsers/paratext-9/paratext9Converter.ts | 16 ++++++--------- 4 files changed, 24 insertions(+), 24 deletions(-) diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index 7b25c59..eecb01c 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -107,11 +107,11 @@ describe('InterlinearizerWebView', () => { it('renders the JSON view mode switch (InterlinearData / Interlinearization / Analyses)', () => { render(); - const group = screen.getByRole('group', { name: /json view mode/i }); - expect(group).toBeInTheDocument(); - expect(screen.getByRole('button', { name: /^interlineardata$/i })).toBeInTheDocument(); - expect(screen.getByRole('button', { name: /^interlinearization$/i })).toBeInTheDocument(); - expect(screen.getByRole('button', { name: /^analyses$/i })).toBeInTheDocument(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + expect(radiogroup).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlineardata$/i })).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlinearization$/i })).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^analyses$/i })).toBeInTheDocument(); expect(screen.getByText(/view json as:/i)).toBeInTheDocument(); }); @@ -150,7 +150,7 @@ describe('InterlinearizerWebView', () => { it('switching to Interlinearization shows converted model JSON', () => { render(); - fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); @@ 
-161,10 +161,10 @@ describe('InterlinearizerWebView', () => { it('switching back to InterlinearData shows PT9 structure JSON', () => { render(); - fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); - fireEvent.click(screen.getByRole('button', { name: /^interlineardata$/i })); + fireEvent.click(screen.getByRole('radio', { name: /^interlineardata$/i })); expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); expect(screen.getByText(/glossLanguage/i)).toBeInTheDocument(); @@ -174,7 +174,7 @@ describe('InterlinearizerWebView', () => { it('switching to Analyses shows analysis map JSON from test data', () => { render(); - fireEvent.click(screen.getByRole('button', { name: /^analyses$/i })); + fireEvent.click(screen.getByRole('radio', { name: /^analyses$/i })); expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); expect(mockCreateAnalyses).toHaveBeenCalledWith(stubInterlinearData); @@ -187,7 +187,7 @@ describe('InterlinearizerWebView', () => { mockConvert.mockReturnValueOnce(undefined); const { container } = render(); - fireEvent.click(screen.getByRole('button', { name: /^interlinearization$/i })); + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); const jsonPre = container.querySelector('pre'); expect(jsonPre).toBeInTheDocument(); diff --git a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts index f8a2600..842ff50 100644 --- a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts +++ b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts @@ -212,6 +212,7 @@ describe('convertParatext9ToInterlinearization', () => { }; const result = convertParatext9ToInterlinearization(data); + expect(result.books[0].textVersion).toBe('H1'); 
expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('approved'); }); }); diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index b3808ba..a14a998 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -91,42 +91,45 @@ globalThis.webViewComponent = function InterlinearizerWebView() { View JSON as:
diff --git a/src/parsers/paratext-9/paratext9Converter.ts b/src/parsers/paratext-9/paratext9Converter.ts index 19fd2dc..27ae517 100644 --- a/src/parsers/paratext-9/paratext9Converter.ts +++ b/src/parsers/paratext-9/paratext9Converter.ts @@ -134,23 +134,19 @@ function convertVerseToSegment( const segmentId = generateSegmentId(verseRef); const wordOccurrences = verseData.clusters.map((cluster, clusterIndex): Occurrence => { + const occurrenceId = generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex); const assignments = cluster.lexemes.map((lexeme): AnalysisAssignment => { const analysisId = generateAnalysisId(lexeme.lexemeId, lexeme.senseId, glossLanguage); - const assignmentId = generateAssignmentId( - generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex), - analysisId, - ); + const assignmentId = generateAssignmentId(occurrenceId, analysisId); return { id: assignmentId, - occurrenceId: generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex), + occurrenceId, analysisId, status: verseData.hash ? AssignmentStatus.Approved : AssignmentStatus.Suggested, }; }); - const occurrenceId = generateOccurrenceIdFromCluster(segmentId, cluster.id, clusterIndex); - return { id: occurrenceId, segmentId, @@ -258,9 +254,9 @@ export function convertParatext9ToInterlinearization( return convertVerseToSegment(verseRef, verseData, glossLanguage); }); - const verseDataArray = Object.values(verses); - const verseWithHash = verseDataArray.find((verseData) => verseData.hash); - const textVersion = verseWithHash?.hash || ''; + const sortedVerseRefs = Object.keys(verses).sort(); + const firstVerseRefWithHash = sortedVerseRefs.find((ref) => verses[ref].hash); + const textVersion = firstVerseRefWithHash !== undefined ? 
verses[firstVerseRefWithHash].hash : ''; const analyzedBook: AnalyzedBook = { id: analyzedBookId, From 44199a046803676d50d5ed8d7ac01fe6e21a3351 Mon Sep 17 00:00:00 2001 From: alex-rawlings-yyc Date: Thu, 19 Feb 2026 16:16:45 -0700 Subject: [PATCH 4/8] Add SHA-256 hash-based text version generation and converter support - Introduce SHA-256 hashing for consistent book-level text version generation across Node and WebView environments. - Add Web Crypto-based sha256HexWebCrypto for WebView-safe hashing; support injectable hashSha256Hex in converter options for Node (e.g. paranext-core generateHashFromBuffer). - Compute book text version from sorted, concatenated verse hashes via computeBookTextVersion. - Update paratext9Converter and tests to align with hash-generation behavior and remove obsolete code. - Refactor interlinearizer WebView to use useEffect for async conversion and improve JSON view mode buttons. - Update documentation for data structures and types. --- .../interlinearizer.web-view.test.tsx | 100 +++++++---- .../paratext-9/paratext9Converter.test.ts | 169 ++++++++++++++---- src/interlinearizer.web-view.tsx | 95 +++++----- src/parsers/paratext-9/paratext9Converter.ts | 64 ++++++- src/parsers/paratext-9/pt9-xml.md | 10 +- 5 files changed, 303 insertions(+), 135 deletions(-) diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index eecb01c..b5e0766 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -4,7 +4,7 @@ import type { WebViewProps } from '@papi/core'; import type { SerializedVerseRef } from '@sillsdev/scripture'; -import { fireEvent, render, screen } from '@testing-library/react'; +import { act, fireEvent, render, screen, waitFor } from '@testing-library/react'; import type { InterlinearData } from 'paratext-9-types'; /** Stub InterlinearData returned by the mocked parser. Matches shape the WebView displays. 
*/ @@ -23,7 +23,7 @@ const stubInterlinearization = { }; const mockParse = jest.fn().mockReturnValue(stubInterlinearData); -const mockConvert = jest.fn().mockReturnValue(stubInterlinearization); +const mockConvert = jest.fn().mockResolvedValue(stubInterlinearization); /** Stub analyses map for Analyses view (ID → Analysis). */ const stubAnalysesMap = new Map([ @@ -88,15 +88,31 @@ const testWebViewProps: WebViewProps = { updateWebViewDefinition: () => true, }; +/** + * Renders the WebView and waits for the mount effect's async conversion to settle inside act(). The + * component calls convertParatext9ToInterlinearization(parsed) in useEffect; when the promise + * resolves it calls setInterlinearization. Without waiting, that update runs after the test and + * triggers "An update to ... was not wrapped in act(...)". This helper flushes the async work so + * all state updates are wrapped. + */ +async function renderWebView(): Promise> { + return act(async () => { + const result = render(); + await Promise.resolve(); + await Promise.resolve(); + return result; + }); +} + describe('InterlinearizerWebView', () => { - it('renders the heading "Interlinearizer"', () => { - render(); + it('renders the heading "Interlinearizer"', async () => { + await renderWebView(); expect(screen.getByRole('heading', { name: /interlinearizer/i })).toBeInTheDocument(); }); - it('renders the description mentioning test-data XML', () => { - render(); + it('renders the description mentioning test-data XML', async () => { + await renderWebView(); expect( screen.getByText(/raw json of the model parsed from/i, { exact: false }), @@ -104,8 +120,8 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/test-data\/Interlinear_en_MAT\.xml/i)).toBeInTheDocument(); }); - it('renders the JSON view mode switch (InterlinearData / Interlinearization / Analyses)', () => { - render(); + it('renders the JSON view mode switch (InterlinearData / Interlinearization / Analyses)', async () => { + 
await renderWebView(); const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); expect(radiogroup).toBeInTheDocument(); @@ -115,55 +131,58 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/view json as:/i)).toBeInTheDocument(); }); - it('displays InterlinearData JSON by default when parser returns data', () => { - render(); + it('displays InterlinearData JSON by default when parser returns data', async () => { + await renderWebView(); expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); expect(screen.getByText(/glossLanguage/i)).toBeInTheDocument(); expect(screen.getByText(/bookId/i)).toBeInTheDocument(); }); - it('displays parsed structure including glossLanguage and bookId values', () => { - render(); + it('displays parsed structure including glossLanguage and bookId values', async () => { + await renderWebView(); expect(screen.getByText(/"en"/)).toBeInTheDocument(); expect(screen.getByText(/"MAT"/)).toBeInTheDocument(); }); - it('does not show parse error when parser succeeds', () => { - render(); + it('does not show parse error when parser succeeds', async () => { + await renderWebView(); expect(screen.queryByText(/^parse error$/i)).not.toBeInTheDocument(); }); - it('displays parse error when parser throws an Error (uses err.message)', () => { + it('displays parse error when parser throws an Error (uses err.message)', async () => { mockParse.mockImplementationOnce(() => { throw new Error('Invalid XML structure'); }); - render(); + await renderWebView(); expect(screen.getByRole('heading', { name: /^parse error$/i })).toBeInTheDocument(); expect(screen.getByText(/invalid xml structure/i)).toBeInTheDocument(); }); - it('switching to Interlinearization shows converted model JSON', () => { - render(); + it('switching to Interlinearization shows converted model JSON', async () => { + await renderWebView(); fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); 
expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); - expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); - expect(screen.getByText(/sourceWritingSystem/i)).toBeInTheDocument(); - expect(screen.getByText(/segments/i)).toBeInTheDocument(); + await waitFor(() => { + expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); + expect(screen.getByText(/sourceWritingSystem/i)).toBeInTheDocument(); + expect(screen.getByText(/segments/i)).toBeInTheDocument(); + }); }); - it('switching back to InterlinearData shows PT9 structure JSON', () => { - render(); + it('switching back to InterlinearData shows PT9 structure JSON', async () => { + await renderWebView(); fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); - expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); - + await waitFor(() => { + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + }); fireEvent.click(screen.getByRole('radio', { name: /^interlineardata$/i })); expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); @@ -171,8 +190,8 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/bookId/i)).toBeInTheDocument(); }); - it('switching to Analyses shows analysis map JSON from test data', () => { - render(); + it('switching to Analyses shows analysis map JSON from test data', async () => { + await renderWebView(); fireEvent.click(screen.getByRole('radio', { name: /^analyses$/i })); @@ -183,11 +202,14 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/paratext-9/i)).toBeInTheDocument(); }); - it('renders empty JSON pre when jsonToShow is undefined (converter returns undefined)', () => { - mockConvert.mockReturnValueOnce(undefined); + it('renders empty JSON pre when jsonToShow is undefined (converter returns undefined)', async () => { + mockConvert.mockResolvedValueOnce(undefined); - const { container } = render(); + const 
{ container } = await renderWebView(); fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); + await waitFor(() => { + expect(container.querySelector('pre')).toBeInTheDocument(); + }); const jsonPre = container.querySelector('pre'); expect(jsonPre).toBeInTheDocument(); @@ -195,16 +217,30 @@ describe('InterlinearizerWebView', () => { expect(jsonPre).not.toHaveTextContent('undefined'); }); - it('displays parse error when parser throws non-Error (uses String(err))', () => { + it('displays parse error when parser throws non-Error (uses String(err))', async () => { mockParse.mockImplementationOnce(() => { // Intentionally throw a non-Error to test the String(err) branch in the catch block. // eslint-disable-next-line no-throw-literal -- testing non-Error handling throw 'plain string error'; }); - render(); + await renderWebView(); expect(screen.getByRole('heading', { name: /^parse error$/i })).toBeInTheDocument(); expect(screen.getByText('plain string error')).toBeInTheDocument(); }); + + it('sets interlinearization to undefined when converter rejects', async () => { + mockConvert.mockRejectedValueOnce(new Error('Conversion failed')); + + const { container } = await renderWebView(); + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); + await waitFor(() => { + expect(container.querySelector('pre')).toBeInTheDocument(); + }); + + const jsonPre = container.querySelector('pre'); + expect(jsonPre).toBeInTheDocument(); + expect(jsonPre).toBeEmptyDOMElement(); + }); }); diff --git a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts index 842ff50..f9348ba 100644 --- a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts +++ b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts @@ -1,21 +1,38 @@ -/** @file Unit tests for {@link convertParatext9ToInterlinearization} and {@link createAnalyses}. 
*/ +/** + * @file Unit tests for {@link convertParatext9ToInterlinearization} and {@link createAnalyses}. + * @jest-environment node + */ /// +import { createHash } from 'crypto'; import type { InterlinearData } from 'paratext-9-types'; import { convertParatext9ToInterlinearization, createAnalyses, } from 'parsers/paratext-9/paratext9Converter'; +/** SHA-256 hex hasher using Node crypto. */ +function nodeSha256Hex(str: string): Promise { + return Promise.resolve(createHash('sha256').update(str, 'utf8').digest('hex')); +} + +/** Options for converter calls in tests: use Node crypto. */ +const nodeHashOptions = { hashSha256Hex: nodeSha256Hex }; + +/** Expected textVersion for a single verse hash: SHA-256( hash ) in hex. */ +function expectedTextVersionForSingleHash(hash: string): string { + return createHash('sha256').update(hash, 'utf8').digest('hex'); +} + describe('convertParatext9ToInterlinearization', () => { describe('top-level structure', () => { - it('produces Interlinearization with id, sourceWritingSystem, analysisLanguages, books', () => { + it('produces Interlinearization with id, sourceWritingSystem, analysisLanguages, books', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result).toHaveProperty('id'); expect(result).toHaveProperty('sourceWritingSystem', ''); @@ -25,46 +42,46 @@ describe('convertParatext9ToInterlinearization', () => { expect(Array.isArray(result.books)).toBe(true); }); - it('uses bookId for interlinearization id (lowercase, spaces to dashes)', () => { + it('uses bookId for interlinearization id (lowercase, spaces to dashes)', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'RUT', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await 
convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.id).toBe('rut-interlinear'); }); - it('produces id mat-interlinear when bookId is MAT', () => { + it('produces id mat-interlinear when bookId is MAT', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.id).toBe('mat-interlinear'); }); - it('sets analysisLanguages from glossLanguage', () => { + it('sets analysisLanguages from glossLanguage', async () => { const data: InterlinearData = { glossLanguage: 'fr', bookId: 'GEN', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.analysisLanguages).toEqual(['fr']); }); - it('produces exactly one AnalyzedBook with id, bookRef, textVersion, segments', () => { + it('produces exactly one AnalyzedBook with id, bookRef, textVersion, segments', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books).toHaveLength(1); const book = result.books[0]; @@ -77,21 +94,95 @@ describe('convertParatext9ToInterlinearization', () => { }); describe('empty verses', () => { - it('returns empty segments array and empty textVersion when verses is empty', () => { + it('returns empty segments array and empty textVersion when verses is empty', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', verses: {}, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments).toEqual([]); 
expect(result.books[0].textVersion).toBe(''); }); }); + describe('textVersion (composite book-level digest)', () => { + it('is empty when no verse has a hash', async () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { hash: '', clusters: [], punctuations: [] }, + 'MAT 1:2': { hash: '', clusters: [], punctuations: [] }, + }, + }; + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); + expect(result.books[0].textVersion).toBe(''); + }); + + it('is SHA-256 of sorted concatenated hashes when multiple verses have hashes', async () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:2': { + hash: 'hash2', + clusters: [], + punctuations: [], + }, + 'MAT 1:1': { + hash: 'hash1', + clusters: [], + punctuations: [], + }, + }, + }; + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); + const sortedHashes = ['hash1', 'hash2'].sort(); + const expected = createHash('sha256').update(sortedHashes.join(''), 'utf8').digest('hex'); + expect(result.books[0].textVersion).toBe(expected); + }); + + it('uses Web Crypto (sha256HexWebCrypto) when hashSha256Hex option is omitted', async () => { + const data: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { hash: 'a', clusters: [], punctuations: [] }, + 'MAT 1:2': { hash: 'b', clusters: [], punctuations: [] }, + }, + }; + const result = await convertParatext9ToInterlinearization(data); + const sortedHashes = ['a', 'b'].sort(); + const expected = createHash('sha256').update(sortedHashes.join(''), 'utf8').digest('hex'); + expect(result.books[0].textVersion).toBe(expected); + }); + + it('changes when any verse hash changes', async () => { + const base: InterlinearData = { + glossLanguage: 'en', + bookId: 'MAT', + verses: { + 'MAT 1:1': { hash: 'h1', clusters: [], punctuations: [] }, + 'MAT 1:2': { hash: 'h2', clusters: [], punctuations: [] }, + 
}, + }; + const result1 = await convertParatext9ToInterlinearization(base, nodeHashOptions); + const modified = { + ...base, + verses: { + ...base.verses, + 'MAT 1:2': { ...base.verses['MAT 1:2'], hash: 'h2-modified' }, + }, + }; + const result2 = await convertParatext9ToInterlinearization(modified, nodeHashOptions); + expect(result1.books[0].textVersion).not.toBe(result2.books[0].textVersion); + }); + }); + describe('verse to segment conversion', () => { - it('converts one verse with one cluster to one segment with one word occurrence', () => { + it('converts one verse with one cluster to one segment with one word occurrence', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -111,7 +202,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments).toHaveLength(1); const seg = result.books[0].segments[0]; @@ -137,7 +228,7 @@ describe('convertParatext9ToInterlinearization', () => { expect(assign.id).toBe(`assign-${occ.id}-analysis-en-Word:word-sense1`); }); - it('uses verse hash for textVersion and sets assignment status to approved when verse has hash', () => { + it('uses composite book-level digest for textVersion and sets assignment status to approved when verse has hash', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -157,15 +248,15 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); - expect(result.books[0].textVersion).toBe('ABC123'); + expect(result.books[0].textVersion).toBe(expectedTextVersionForSingleHash('ABC123')); expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('approved'); }); }); describe('assignment 
status from verse hash', () => { - it('sets assignment status to suggested when verse has no hash', () => { + it('sets assignment status to suggested when verse has no hash', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -185,12 +276,12 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('suggested'); }); - it('sets assignment status to approved when verse has hash', () => { + it('sets assignment status to approved when verse has hash', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -210,15 +301,15 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); - expect(result.books[0].textVersion).toBe('H1'); + expect(result.books[0].textVersion).toBe(expectedTextVersionForSingleHash('H1')); expect(result.books[0].segments[0].occurrences[0].assignments[0].status).toBe('approved'); }); }); describe('cluster with multiple lexemes', () => { - it('creates one word occurrence with multiple assignments (one per lexeme)', () => { + it('creates one word occurrence with multiple assignments (one per lexeme)', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -241,7 +332,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); const occ = result.books[0].segments[0].occurrences[0]; expect(occ.assignments).toHaveLength(2); @@ -254,7 +345,7 @@ describe('convertParatext9ToInterlinearization', () => { }); describe('punctuation 
occurrences', () => { - it('converts punctuations to punctuation occurrences after word occurrences (surfaceText from afterText when present)', () => { + it('converts punctuations to punctuation occurrences after word occurrences (surfaceText from afterText when present)', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -280,7 +371,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); const seg = result.books[0].segments[0]; expect(seg.occurrences).toHaveLength(2); @@ -294,7 +385,7 @@ describe('convertParatext9ToInterlinearization', () => { expect(puncOcc.id).toBe('mat-1:1-punc-1-34-2'); }); - it('uses beforeText for surfaceText when afterText is empty', () => { + it('uses beforeText for surfaceText when afterText is empty', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -306,12 +397,12 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments[0].occurrences[0].surfaceText).toBe(','); }); - it('uses empty surfaceText when both beforeText and afterText are empty', () => { + it('uses empty surfaceText when both beforeText and afterText are empty', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -323,14 +414,14 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments[0].occurrences[0].surfaceText).toBe(''); }); }); describe('verse with no clusters', () => { - it('produces segment with empty occurrences when verse has no clusters 
and no punctuations', () => { + it('produces segment with empty occurrences when verse has no clusters and no punctuations', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -342,7 +433,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments).toHaveLength(1); expect(result.books[0].segments[0].occurrences).toEqual([]); @@ -352,7 +443,7 @@ describe('convertParatext9ToInterlinearization', () => { }); describe('lexeme without senseId', () => { - it('generates analysis id without sense suffix when senseId is empty', () => { + it('generates analysis id without sense suffix when senseId is empty', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -372,7 +463,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments[0].occurrences[0].assignments[0].analysisId).toBe( 'analysis-en-Word:a', @@ -381,7 +472,7 @@ describe('convertParatext9ToInterlinearization', () => { }); describe('segment and occurrence IDs', () => { - it('generates segment id from verseRef (lowercase, spaces to dashes)', () => { + it('generates segment id from verseRef (lowercase, spaces to dashes)', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -401,12 +492,12 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); expect(result.books[0].segments[0].id).toBe('mat-1:1'); }); - it('generates occurrence id from segmentId, cluster id, and index', () => { + it('generates 
occurrence id from segmentId, cluster id, and index', async () => { const data: InterlinearData = { glossLanguage: 'en', bookId: 'MAT', @@ -426,7 +517,7 @@ describe('convertParatext9ToInterlinearization', () => { }, }, }; - const result = convertParatext9ToInterlinearization(data); + const result = await convertParatext9ToInterlinearization(data, nodeHashOptions); const segId = result.books[0].segments[0].id; expect(result.books[0].segments[0].occurrences[0].id).toBe(`${segId}-occ-0-Word:word/0-4`); diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index a14a998..e13f43d 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -1,4 +1,4 @@ -import { useMemo, useState } from 'react'; +import { useEffect, useMemo, useState } from 'react'; import type { InterlinearData } from 'paratext-9-types'; import { Paratext9Parser } from 'parsers/paratext-9/paratext9Parser'; import { @@ -50,24 +50,38 @@ globalThis.webViewComponent = function InterlinearizerWebView() { } }, []); - const interlinearization = useMemo( - () => (parsed ? convertParatext9ToInterlinearization(parsed) : undefined), - [parsed], - ); + const [interlinearization, setInterlinearization] = useState< + Awaited> | undefined + >(undefined); + + useEffect(() => { + if (!parsed) { + setInterlinearization(undefined); + return; + } + let cancelled = false; + convertParatext9ToInterlinearization(parsed) + .then((result) => { + if (!cancelled) setInterlinearization(result); + return result; + }) + .catch(() => { + if (!cancelled) setInterlinearization(undefined); + }); + return () => { + cancelled = true; + }; + }, [parsed]); /** Analyses map derived from parsed data (ID → Analysis); only defined when parsed exists. */ const analysesMap = useMemo(() => (parsed ? createAnalyses(parsed) : undefined), [parsed]); /** Data to show as JSON: depends on selected view mode. 
*/ - const jsonToShow = ((): - | typeof parsed - | ReturnType - | Record - | undefined => { + const jsonToShow = useMemo(() => { if (jsonViewMode === 'interlinearization') return interlinearization; if (jsonViewMode === 'analyses' && analysesMap) return Object.fromEntries(analysesMap); return parsed; - })(); + }, [jsonViewMode, parsed, interlinearization, analysesMap]); return (
@@ -94,45 +108,26 @@ globalThis.webViewComponent = function InterlinearizerWebView() { role="radiogroup" aria-label="JSON view mode" > - - - + {[ + { key: 'interlinear-data' as const, label: 'InterlinearData' }, + { key: 'interlinearization' as const, label: 'Interlinearization' }, + { key: 'analyses' as const, label: 'Analyses' }, + ].map(({ key, label }) => ( + + ))}

{getViewModeDescription(jsonViewMode)} diff --git a/src/parsers/paratext-9/paratext9Converter.ts b/src/parsers/paratext-9/paratext9Converter.ts index 27ae517..66ffc96 100644 --- a/src/parsers/paratext-9/paratext9Converter.ts +++ b/src/parsers/paratext-9/paratext9Converter.ts @@ -22,6 +22,46 @@ import { Confidence, } from 'types/interlinearizer-enums'; +/** + * Default SHA-256 hex implementation using the Web Crypto API so the converter can run in WebViews. + * + * @param input - UTF-8 string to hash. + * @returns Promise that resolves to the hex-encoded SHA-256 digest. + */ +async function sha256HexWebCrypto(input: string): Promise { + const encoder = new TextEncoder(); + const data = encoder.encode(input); + const hashBuffer = await globalThis.crypto.subtle.digest('SHA-256', data); + const hashArray = Array.from(new Uint8Array(hashBuffer)); + return hashArray.map((b) => b.toString(16).padStart(2, '0')).join(''); +} + +/** + * Computes a stable book-level text version from verse hashes. + * + * Collects all non-empty verse hashes, sorts them deterministically, concatenates them, and returns + * the SHA-256 digest in hex. Used so that textVersion reflects changes in any verse. Uses the + * provided hasher or the default Web Crypto implementation (for WebViews). + * + * @param verseDataArray - Verse data in deterministic (e.g. sorted by ref) order. + * @param hashSha256Hex - Optional hasher; when omitted, uses Web Crypto. In Node contexts pass one + * that matches paranext-core's generateHashFromBuffer('sha256', 'hex', Buffer.from(str, + * 'utf8')). + * @returns Promise that resolves to the hex SHA-256 digest, or '' if no verse hashes. 
+ */ +async function computeBookTextVersion( + verseDataArray: VerseData[], + hashSha256Hex: (input: string) => Promise, +): Promise { + const nonEmptyHashes = verseDataArray + .map((vd) => vd.hash) + .filter((h): h is string => h.length > 0); + if (nonEmptyHashes.length === 0) return ''; + const sortedHashes = [...nonEmptyHashes].sort(); + const concatenated = sortedHashes.join(''); + return hashSha256Hex(concatenated); +} + /** * Generates a deterministic ID for an interlinearization from Paratext 9 data. * @@ -138,7 +178,6 @@ function convertVerseToSegment( const assignments = cluster.lexemes.map((lexeme): AnalysisAssignment => { const analysisId = generateAnalysisId(lexeme.lexemeId, lexeme.senseId, glossLanguage); const assignmentId = generateAssignmentId(occurrenceId, analysisId); - return { id: assignmentId, occurrenceId, @@ -146,7 +185,6 @@ function convertVerseToSegment( status: verseData.hash ? AssignmentStatus.Approved : AssignmentStatus.Suggested, }; }); - return { id: occurrenceId, segmentId, @@ -238,14 +276,22 @@ export function createAnalyses(interlinearData: InterlinearData): Map Promise; +}; + +export async function convertParatext9ToInterlinearization( interlinearData: InterlinearData, -): Interlinearization { + options?: ConvertParatext9Options, +): Promise { const { glossLanguage, bookId, verses } = interlinearData; + const hashSha256Hex = options?.hashSha256Hex ?? sha256HexWebCrypto; const interlinearizationId = generateInterlinearizationId(bookId); const analyzedBookId = generateBookId(bookId); @@ -255,8 +301,8 @@ export function convertParatext9ToInterlinearization( }); const sortedVerseRefs = Object.keys(verses).sort(); - const firstVerseRefWithHash = sortedVerseRefs.find((ref) => verses[ref].hash); - const textVersion = firstVerseRefWithHash !== undefined ? 
verses[firstVerseRefWithHash].hash : ''; + const verseDataArray = sortedVerseRefs.map((ref) => verses[ref]); + const textVersion = await computeBookTextVersion(verseDataArray, hashSha256Hex); const analyzedBook: AnalyzedBook = { id: analyzedBookId, diff --git a/src/parsers/paratext-9/pt9-xml.md b/src/parsers/paratext-9/pt9-xml.md index 7cb7caf..6c8cd0a 100644 --- a/src/parsers/paratext-9/pt9-xml.md +++ b/src/parsers/paratext-9/pt9-xml.md @@ -41,12 +41,12 @@ The extension reads PT9 interlinear data from XML files (e.g. `Interlinear_ Date: Thu, 19 Feb 2026 17:28:51 -0700 Subject: [PATCH 5/8] Update package configuration and enhance interlinearizer WebView functionality - Add Node.js version requirement (>=18) to package.json and package-lock.json. - Improve interlinearizer WebView by implementing keyboard navigation for JSON view modes, allowing users to switch between modes using arrow keys. - Refactor related tests to ensure proper functionality of the new keyboard navigation feature. - Update README to reflect the new Node.js requirement and clarify usage of test data paths. 
--- README.md | 6 +- package-lock.json | 3 + package.json | 3 + .../interlinearizer.web-view.test.tsx | 167 +++++++++++++++++- .../paratext-9/paratext9Converter.test.ts | 2 +- .../paratext-9/paratext9Parser.test.ts | 12 +- src/__tests__/test-helpers.ts | 15 +- src/interlinearizer.web-view.tsx | 61 +++++-- src/parsers/paratext-9/paratext-9-types.ts | 114 ++++++------ src/parsers/paratext-9/paratext9Converter.ts | 6 +- src/parsers/paratext-9/paratext9Parser.ts | 6 +- src/types/interlinearizer-enums.ts | 6 +- 12 files changed, 308 insertions(+), 93 deletions(-) diff --git a/README.md b/README.md index 64ef32c..0e5b2da 100644 --- a/README.md +++ b/README.md @@ -108,7 +108,7 @@ The general file structure for an extension is as follows: - `assets/descriptions/description-.md` contains a brief description of the extension in the language specified by `` - `contributions/` contains JSON files the platform uses to extend data structures for things like menus and settings. The JSON files are referenced from the manifest - `public/` contains other static files that are copied into the build folder -- `test-data/` contains sample interlinear XML (e.g. `Interlinear_en_MAT.xml`) for development and tests +- `test-data/` contains sample interlinear XML (e.g. `Interlinear_en_MAT.xml`) for development and tests. In tests, resolve paths via `getTestDataPath('Interlinear_en_MAT.xml')` from `src/__tests__/test-helpers` rather than building paths with `..` segments. - `.github/` contains files to facilitate integration with GitHub - `.github/workflows` contains [GitHub Actions](https://github.com/features/actions) workflows for automating various processes in this repo (e.g. 
**Test** and **Lint** on push/PR to main, release-prep, hotfix-\*; **Publish** and **Bump Versions** manual dispatch; **CodeQL** for security) - `.github/assets/release-body.md` combined with a generated changelog becomes the body of [releases published using GitHub Actions](#publishing) @@ -119,6 +119,10 @@ The general file structure for an extension is as follows: ## To install +### Requirements + +- **Node.js >= 18** is required. The test suite uses the Web Crypto API (`globalThis.crypto.subtle`) for hashing in `paratext9Converter` tests (e.g. the `sha256HexWebCrypto` path in `src/__tests__/parsers/paratext-9/paratext9Converter.test.ts` when `convertParatext9ToInterlinearization` is called without the `hashSha256Hex` option). Node 18+ provides this API; older versions will cause those tests to fail. The same requirement is enforced in `package.json` via `engines.node` and is used by CI. + ### Install dependencies: 1. Follow the instructions to install [`paranext-core`](https://github.com/paranext/paranext-core#developer-install). We recommend you clone `paranext-core` in the same parent directory in which you cloned this repository so you do not have to [reconfigure paths](#configure-paths-to-paranext-core-repo) to `paranext-core`. 
diff --git a/package-lock.json b/package-lock.json index 080ad78..af7ddf1 100644 --- a/package-lock.json +++ b/package-lock.json @@ -73,6 +73,9 @@ "webpack-merge": "^6.0.1", "zip-build": "^1.8.0" }, + "engines": { + "node": ">=18" + }, "peerDependencies": { "react": ">=18.3.1", "react-dom": ">=18.3.1" diff --git a/package.json b/package.json index 993e48e..ac6c990 100644 --- a/package.json +++ b/package.json @@ -6,6 +6,9 @@ "types": "src/types/interlinearizer.d.ts", "author": "SIL Global", "license": "MIT", + "engines": { + "node": ">=18" + }, "scripts": { "build:web-view": "webpack --config ./webpack/webpack.config.web-view.ts", "build:main": "webpack --config ./webpack/webpack.config.main.ts", diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index b5e0766..45e60a4 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -5,7 +5,8 @@ import type { WebViewProps } from '@papi/core'; import type { SerializedVerseRef } from '@sillsdev/scripture'; import { act, fireEvent, render, screen, waitFor } from '@testing-library/react'; -import type { InterlinearData } from 'paratext-9-types'; +import React from 'react'; +import type { InterlinearData } from 'parsers/paratext-9/paratext-9-types'; /** Stub InterlinearData returned by the mocked parser. Matches shape the WebView displays. 
*/ const stubInterlinearData: InterlinearData = { @@ -202,6 +203,21 @@ describe('InterlinearizerWebView', () => { expect(screen.getByText(/paratext-9/i)).toBeInTheDocument(); }); + it('Analyses view shows empty JSON pre when createAnalyses returns undefined', async () => { + mockCreateAnalyses.mockReturnValueOnce(undefined); + + const { container } = await renderWebView(); + fireEvent.click(screen.getByRole('radio', { name: /^analyses$/i })); + await waitFor(() => { + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + }); + + const jsonPre = container.querySelector('pre'); + expect(jsonPre).toBeInTheDocument(); + expect(jsonPre).toBeEmptyDOMElement(); + expect(jsonPre).not.toHaveTextContent('undefined'); + }); + it('renders empty JSON pre when jsonToShow is undefined (converter returns undefined)', async () => { mockConvert.mockResolvedValueOnce(undefined); @@ -243,4 +259,153 @@ describe('InterlinearizerWebView', () => { expect(jsonPre).toBeInTheDocument(); expect(jsonPre).toBeEmptyDOMElement(); }); + + describe('handleJsonViewModeKeyDown', () => { + it('ArrowRight moves to next mode and updates selection', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowRight' }); + }); + + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlinearization$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('ArrowDown moves to next mode', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowDown' }); + }); + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + + await act(async 
() => { + fireEvent.keyDown(radiogroup, { key: 'ArrowDown' }); + }); + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + }); + + it('ArrowRight from last mode (Analyses) wraps to first (InterlinearData)', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + fireEvent.click(screen.getByRole('radio', { name: /^analyses$/i })); + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowRight' }); + }); + + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlineardata$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('ArrowLeft moves to previous mode', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + fireEvent.click(screen.getByRole('radio', { name: /^analyses$/i })); + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowLeft' }); + }); + + expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlinearization$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('ArrowUp moves to previous mode', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowUp' }); + }); + + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlineardata$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('ArrowLeft from first mode (InterlinearData) wraps to last 
(Analyses)', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowLeft' }); + }); + + expect(screen.getByText(/^Analyses \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^analyses$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('non-arrow key does not change mode', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + + fireEvent.keyDown(radiogroup, { key: 'a' }); + fireEvent.keyDown(radiogroup, { key: 'Enter' }); + expect(screen.getByText(/^InterlinearData \(JSON\):$/)).toBeInTheDocument(); + expect(screen.getByRole('radio', { name: /^interlineardata$/i })).toHaveAttribute( + 'aria-checked', + 'true', + ); + }); + + it('moves focus to the newly selected radio on arrow key', async () => { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + const interlinearizationRadio = screen.getByRole('radio', { + name: /^interlinearization$/i, + }); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowRight' }); + }); + + expect(document.activeElement).toBe(interlinearizationRadio); + }); + + it('does nothing when current view mode is not in JSON_VIEW_MODES (idx === -1)', async () => { + const setJsonViewMode = jest.fn(); + let useStateCallCount = 0; + const useStateSpy = jest.spyOn(React, 'useState').mockImplementation(() => { + useStateCallCount += 1; + return useStateCallCount === 1 ? 
['invalid', setJsonViewMode] : [undefined, jest.fn()]; + }); + + try { + await renderWebView(); + const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); + + await act(async () => { + fireEvent.keyDown(radiogroup, { key: 'ArrowRight' }); + }); + + expect(setJsonViewMode).not.toHaveBeenCalled(); + } finally { + useStateSpy.mockRestore(); + } + }); + }); }); diff --git a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts index f9348ba..f64a101 100644 --- a/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts +++ b/src/__tests__/parsers/paratext-9/paratext9Converter.test.ts @@ -5,11 +5,11 @@ /// import { createHash } from 'crypto'; -import type { InterlinearData } from 'paratext-9-types'; import { convertParatext9ToInterlinearization, createAnalyses, } from 'parsers/paratext-9/paratext9Converter'; +import type { InterlinearData } from 'parsers/paratext-9/paratext-9-types'; /** SHA-256 hex hasher using Node crypto. 
*/ function nodeSha256Hex(str: string): Promise { diff --git a/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts b/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts index eed880b..ac9193d 100644 --- a/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts +++ b/src/__tests__/parsers/paratext-9/paratext9Parser.test.ts @@ -2,9 +2,9 @@ /// import * as fs from 'fs'; -import * as path from 'path'; import { Paratext9Parser } from 'parsers/paratext-9/paratext9Parser'; +import { getTestDataPath } from '../../test-helpers'; describe('Paratext9Parser', () => { let parser: Paratext9Parser; @@ -575,15 +575,7 @@ describe('Paratext9Parser', () => { }); it('parses real test-data file without throwing', () => { - const xmlPath = path.join( - __dirname, - '..', - '..', - '..', - '..', - 'test-data', - 'Interlinear_en_MAT.xml', - ); + const xmlPath = getTestDataPath('Interlinear_en_MAT.xml'); const xml = fs.readFileSync(xmlPath, 'utf-8'); const result = parser.parse(xml); diff --git a/src/__tests__/test-helpers.ts b/src/__tests__/test-helpers.ts index 2669edc..9c63a67 100644 --- a/src/__tests__/test-helpers.ts +++ b/src/__tests__/test-helpers.ts @@ -1,10 +1,23 @@ /** * @file Test helpers used to build type-safe mocks without type assertions. Provides a minimal - * ExecutionActivationContext that satisfies @papi/core types. + * ExecutionActivationContext that satisfies @papi/core types, and a stable path resolver for the + * test-data directory. */ +import * as path from 'path'; + import type { ExecutionActivationContext } from '@papi/core'; import { UnsubscriberAsyncList } from 'platform-bible-utils'; +/** + * Resolves a path to a file under the project's test-data directory. + * + * @param relativePath - Filename or path relative to test-data (e.g. 'Interlinear_en_MAT.xml'). + * @returns Absolute path to the file under test-data. 
+ */ +export function getTestDataPath(relativePath: string): string { + return path.resolve(__dirname, '..', '..', 'test-data', relativePath); +} + /** Minimal execution token-shaped object for tests (structural match for ExecutionToken). */ const mockExecutionToken: { type: 'extension'; diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index e13f43d..6de060b 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -1,11 +1,12 @@ -import { useEffect, useMemo, useState } from 'react'; -import type { InterlinearData } from 'paratext-9-types'; +import React, { useEffect, useMemo, useRef, useState } from 'react'; +import type { InterlinearData } from 'parsers/paratext-9/paratext-9-types'; import { Paratext9Parser } from 'parsers/paratext-9/paratext9Parser'; import { convertParatext9ToInterlinearization, createAnalyses, } from 'parsers/paratext-9/paratext9Converter'; +import type { Interlinearization } from 'interlinearizer'; /** Test interlinear XML bundled at build time (from test-data/Interlinear_en_MAT.xml). */ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; @@ -15,6 +16,13 @@ type ParseResult = { data: InterlinearData; error: undefined } | { data: undefin /** View mode for the JSON display: raw PT9, converted model, or analyses map. */ type JsonViewMode = 'interlinear-data' | 'interlinearization' | 'analyses'; +/** Ordered list of JSON view modes for rendering and arrow-key navigation. 
*/ +const JSON_VIEW_MODES: { key: JsonViewMode; label: string }[] = [ + { key: 'interlinear-data', label: 'InterlinearData' }, + { key: 'interlinearization', label: 'Interlinearization' }, + { key: 'analyses', label: 'Analyses' }, +]; + function getViewModeDescription(mode: JsonViewMode): string { if (mode === 'interlinear-data') return 'Paratext 9 book/verse/cluster structure.'; if (mode === 'interlinearization') @@ -40,6 +48,34 @@ function getViewModeLabel(mode: JsonViewMode): string { globalThis.webViewComponent = function InterlinearizerWebView() { const [jsonViewMode, setJsonViewMode] = useState('interlinear-data'); + /** Refs to each radio button for moving focus on arrow-key navigation. */ + const radioRefs = useRef>({ + 'interlinear-data': undefined, + interlinearization: undefined, + analyses: undefined, + }); + + /** + * Handles arrow keys on the JSON view mode radiogroup: Left/Up select previous, Right/Down select + * next; updates selection and moves focus to the new radio. + */ + const handleJsonViewModeKeyDown = (e: React.KeyboardEvent) => { + const idx = JSON_VIEW_MODES.findIndex((m) => m.key === jsonViewMode); + if (idx === -1) return; + let nextKey: JsonViewMode | undefined; + if (e.key === 'ArrowRight' || e.key === 'ArrowDown') { + e.preventDefault(); + nextKey = JSON_VIEW_MODES[(idx + 1) % JSON_VIEW_MODES.length].key; + setJsonViewMode(nextKey); + radioRefs.current[nextKey]?.focus(); + } else if (e.key === 'ArrowLeft' || e.key === 'ArrowUp') { + e.preventDefault(); + nextKey = JSON_VIEW_MODES[(idx - 1 + JSON_VIEW_MODES.length) % JSON_VIEW_MODES.length].key; + setJsonViewMode(nextKey); + radioRefs.current[nextKey]?.focus(); + } + }; + const { data: parsed, error: parseError } = useMemo((): ParseResult => { const parser = new Paratext9Parser(); try { @@ -50,9 +86,7 @@ globalThis.webViewComponent = function InterlinearizerWebView() { } }, []); - const [interlinearization, setInterlinearization] = useState< - Awaited> | undefined - >(undefined); + 
const [interlinearization, setInterlinearization] = useState(); useEffect(() => { if (!parsed) { @@ -79,7 +113,8 @@ globalThis.webViewComponent = function InterlinearizerWebView() { /** Data to show as JSON: depends on selected view mode. */ const jsonToShow = useMemo(() => { if (jsonViewMode === 'interlinearization') return interlinearization; - if (jsonViewMode === 'analyses' && analysesMap) return Object.fromEntries(analysesMap); + if (jsonViewMode === 'analyses') + return analysesMap ? Object.fromEntries(analysesMap) : undefined; return parsed; }, [jsonViewMode, parsed, interlinearization, analysesMap]); @@ -107,23 +142,25 @@ globalThis.webViewComponent = function InterlinearizerWebView() { className="tw-inline-flex tw-rounded-md tw-border tw-border-border tw-bg-muted tw-p-0.5" role="radiogroup" aria-label="JSON view mode" + tabIndex={-1} + onKeyDown={handleJsonViewModeKeyDown} > - {[ - { key: 'interlinear-data' as const, label: 'InterlinearData' }, - { key: 'interlinearization' as const, label: 'Interlinearization' }, - { key: 'analyses' as const, label: 'Analyses' }, - ].map(({ key, label }) => ( + {JSON_VIEW_MODES.map(({ key, label }) => ( diff --git a/src/parsers/paratext-9/paratext-9-types.ts b/src/parsers/paratext-9/paratext-9-types.ts index 9aa1c3c..1ffd187 100644 --- a/src/parsers/paratext-9/paratext-9-types.ts +++ b/src/parsers/paratext-9/paratext-9-types.ts @@ -1,64 +1,62 @@ -declare module 'paratext-9-types' { - /** Character range in source text (Index, Length). */ - export interface StringRange { - /** Start index of the range in the source text (0-based). */ - index: number; - /** Number of characters in the range. */ - length: number; - } +/** Character range in source text (Index, Length). */ +export interface StringRange { + /** Start index of the range in the source text (0-based). */ + index: number; + /** Number of characters in the range. */ + length: number; +} - /** Data on the interlinearization of a single lexeme. 
*/ - export interface LexemeData { - /** ID of the lexeme (e.g. from Lexicon; XML attribute Id). */ - lexemeId: string; - /** ID of the sense/gloss used for this lexeme (XML attribute GlossId). */ - senseId: string; - } +/** Data on the interlinearization of a single lexeme. */ +export interface LexemeData { + /** ID of the lexeme (e.g. from Lexicon; XML attribute Id). */ + lexemeId: string; + /** ID of the sense/gloss used for this lexeme (XML attribute GlossId). */ + senseId: string; +} - /** Data on the interlinearization of a cluster. */ - export interface ClusterData { - /** Character range this cluster occupies in the verse text. */ - textRange: StringRange; - /** Lexemes in this cluster, in order. */ - lexemes: LexemeData[]; - /** Slash-joined LexemeIds for this cluster (e.g. "Word:a/Word:b"). */ - lexemesId: string; - /** Unique cluster id: LexemesId plus TextRange (e.g. "Word:a/Word:b/21-3"). */ - id: string; - /** Excluded flag. See [pt9-xml.md](pt9-xml.md) for details. */ - excluded: boolean; - } +/** Data on the interlinearization of a cluster. */ +export interface ClusterData { + /** Character range this cluster occupies in the verse text. */ + textRange: StringRange; + /** Lexemes in this cluster, in order. */ + lexemes: LexemeData[]; + /** Slash-joined LexemeIds for this cluster (e.g. "Word:a/Word:b"). */ + lexemesId: string; + /** Unique cluster id: LexemesId plus TextRange (e.g. "Word:a/Word:b/21-3"). */ + id: string; + /** Excluded flag. See [pt9-xml.md](pt9-xml.md) for details. */ + excluded: boolean; +} - /** Data on punctuation change. */ - export interface PunctuationData { - /** Character range this punctuation occupies in the verse text. */ - textRange: StringRange; - /** Punctuation text before the change (or empty). */ - beforeText: string; - /** Punctuation text after the change (or empty). */ - afterText: string; - } +/** Data on punctuation change. 
*/ +export interface PunctuationData { + /** Character range this punctuation occupies in the verse text. */ + textRange: StringRange; + /** Punctuation text before the change (or empty). */ + beforeText: string; + /** Punctuation text after the change (or empty). */ + afterText: string; +} - /** Interlinear data for a single verse. */ - export interface VerseData { - /** Hash of verse text when approved; empty string if not approved. */ - hash: string; - /** Lexeme clusters in this verse. */ - clusters: ClusterData[]; - /** Punctuation changes in this verse. */ - punctuations: PunctuationData[]; - } +/** Interlinear data for a single verse. */ +export interface VerseData { + /** Hash of verse text when approved; empty string if not approved. */ + hash: string; + /** Lexeme clusters in this verse. */ + clusters: ClusterData[]; + /** Punctuation changes in this verse. */ + punctuations: PunctuationData[]; +} - /** Root interlinear data: book + verses. */ - export interface InterlinearData { - /** Language code or name for the glosses. */ - glossLanguage: string; - /** Book id (e.g. "RUT", "MAT"). */ - bookId: string; - /** - * Verse data keyed by verse reference (e.g. "RUT 3:1"). Exactly one entry per reference; the - * parser rejects XML that contains duplicate verse references. - */ - verses: Record; - } +/** Root interlinear data: book + verses. */ +export interface InterlinearData { + /** Language code or name for the glosses. */ + glossLanguage: string; + /** Book id (e.g. "RUT", "MAT"). */ + bookId: string; + /** + * Verse data keyed by verse reference (e.g. "RUT 3:1"). Exactly one entry per reference; the + * parser rejects XML that contains duplicate verse references. 
+ */ + verses: Record; } diff --git a/src/parsers/paratext-9/paratext9Converter.ts b/src/parsers/paratext-9/paratext9Converter.ts index 66ffc96..740f350 100644 --- a/src/parsers/paratext-9/paratext9Converter.ts +++ b/src/parsers/paratext-9/paratext9Converter.ts @@ -6,7 +6,6 @@ * interlinearizer's book/segment/occurrence/analysis structure. */ -import type { InterlinearData, VerseData, StringRange } from 'paratext-9-types'; import type { Interlinearization, AnalyzedBook, @@ -21,6 +20,7 @@ import { AssignmentStatus, Confidence, } from 'types/interlinearizer-enums'; +import type { InterlinearData, VerseData, StringRange } from './paratext-9-types'; /** * Default SHA-256 hex implementation using the Web Crypto API so the converter can run in WebViews. @@ -295,13 +295,13 @@ export async function convertParatext9ToInterlinearization( const interlinearizationId = generateInterlinearizationId(bookId); const analyzedBookId = generateBookId(bookId); + const sortedVerseRefs = Object.keys(verses).sort(); + const verseDataArray = sortedVerseRefs.map((ref) => verses[ref]); const segments = Object.entries(verses).map(([verseRef, verseData]) => { return convertVerseToSegment(verseRef, verseData, glossLanguage); }); - const sortedVerseRefs = Object.keys(verses).sort(); - const verseDataArray = sortedVerseRefs.map((ref) => verses[ref]); const textVersion = await computeBookTextVersion(verseDataArray, hashSha256Hex); const analyzedBook: AnalyzedBook = { diff --git a/src/parsers/paratext-9/paratext9Parser.ts b/src/parsers/paratext-9/paratext9Parser.ts index ce9372e..cfd9ebb 100644 --- a/src/parsers/paratext-9/paratext9Parser.ts +++ b/src/parsers/paratext-9/paratext9Parser.ts @@ -6,7 +6,7 @@ import type { StringRange, InterlinearData, VerseData, -} from 'paratext-9-types'; +} from './paratext-9-types'; /** Range: Index and Length attributes. 
*/ interface ParsedRange { @@ -174,8 +174,8 @@ function extractClustersFromVerse(verseDataElement: ParsedVerseData): ClusterDat * Parses interlinear XML strings into {@link InterlinearData} using fast-xml-parser. * * Input is a raw XML string (caller is responsible for obtaining it, e.g. from file or network). - * Output matches the types in `interlinearizer`; no extra conversion is done. Expects the - * interlinear XML schema described in [pt9-xml.md](pt9-xml.md). + * Output matches the types in `paratext-9-types`; no extra conversion is done. Expects the Paratext + * 9 Interlinear XML schema described in [pt9-xml.md](pt9-xml.md). */ export class Paratext9Parser { private readonly parser: XMLParser; diff --git a/src/types/interlinearizer-enums.ts b/src/types/interlinearizer-enums.ts index 5ea8052..238baa4 100644 --- a/src/types/interlinearizer-enums.ts +++ b/src/types/interlinearizer-enums.ts @@ -30,10 +30,10 @@ export enum AnalysisType { /** * How the analysis was produced. * - * - `high` - * - `medium` - * - `low` * - `guess` + * - `low` + * - `medium` + * - `high` */ export enum Confidence { Guess = 'guess', From f8ba187900fec4fc4b7316fdea9d9e90acdeaf2a Mon Sep 17 00:00:00 2001 From: alex-rawlings-yyc Date: Thu, 19 Feb 2026 17:54:45 -0700 Subject: [PATCH 6/8] Enhance interlinearizer WebView with conversion status and keyboard navigation improvements - Export `JsonViewMode` type and add a sentinel for conversion status to indicate when interlinearization is in progress. - Implement `formatJsonPreContent` function to display "Converting..." during the conversion process. - Refactor keyboard navigation handling for JSON view modes, improving the separation of concerns and testability. - Update tests to verify the new conversion status display and ensure keyboard navigation functionality works as expected. 
--- .../interlinearizer.web-view.test.tsx | 72 ++++++++---- src/interlinearizer.web-view.tsx | 110 +++++++++++++----- src/parsers/paratext-9/paratext9Converter.ts | 7 +- 3 files changed, 134 insertions(+), 55 deletions(-) diff --git a/src/__tests__/interlinearizer.web-view.test.tsx b/src/__tests__/interlinearizer.web-view.test.tsx index 45e60a4..33c6d1f 100644 --- a/src/__tests__/interlinearizer.web-view.test.tsx +++ b/src/__tests__/interlinearizer.web-view.test.tsx @@ -5,7 +5,6 @@ import type { WebViewProps } from '@papi/core'; import type { SerializedVerseRef } from '@sillsdev/scripture'; import { act, fireEvent, render, screen, waitFor } from '@testing-library/react'; -import React from 'react'; import type { InterlinearData } from 'parsers/paratext-9/paratext-9-types'; /** Stub InterlinearData returned by the mocked parser. Matches shape the WebView displays. */ @@ -56,6 +55,9 @@ jest.mock('parsers/paratext-9/paratext9Converter', () => ({ createAnalyses: mockCreateAnalyses, })); +// eslint-disable-next-line import/first -- import order required for Jest mock initialization +import * as interlinearizerWebViewModule from '../interlinearizer.web-view'; + /** * Load the WebView module; it assigns the component to globalThis.webViewComponent. This pattern is * required by the Platform.Bible WebView framework: the WebView entry is built with a ?inline query @@ -63,9 +65,9 @@ jest.mock('parsers/paratext-9/paratext9Converter', () => ({ * component must require() the module and read globalThis. If the WebView export mechanism changes, * update this test accordingly. */ -require('../interlinearizer.web-view'); const InterlinearizerWebView = globalThis.webViewComponent; +const { handleJsonViewModeKeyDown } = interlinearizerWebViewModule; if (!InterlinearizerWebView) throw new Error('webViewComponent not loaded'); /** Minimal SerializedVerseRef for hook mock return. 
*/ @@ -106,6 +108,10 @@ async function renderWebView(): Promise> { } describe('InterlinearizerWebView', () => { + beforeEach(() => { + jest.clearAllMocks(); + }); + it('renders the heading "Interlinearizer"', async () => { await renderWebView(); @@ -170,11 +176,9 @@ describe('InterlinearizerWebView', () => { fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); expect(screen.getByText(/^Interlinearization \(JSON\):$/)).toBeInTheDocument(); - await waitFor(() => { - expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); - expect(screen.getByText(/sourceWritingSystem/i)).toBeInTheDocument(); - expect(screen.getByText(/segments/i)).toBeInTheDocument(); - }); + await waitFor(() => expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument()); + await waitFor(() => expect(screen.getByText(/sourceWritingSystem/i)).toBeInTheDocument()); + await waitFor(() => expect(screen.getByText(/segments/i)).toBeInTheDocument()); }); it('switching back to InterlinearData shows PT9 structure JSON', async () => { @@ -233,6 +237,36 @@ describe('InterlinearizerWebView', () => { expect(jsonPre).not.toHaveTextContent('undefined'); }); + it('shows "Converting..." 
in Interlinearization view while conversion is in flight', async () => { + let resolveConvert: ((value: typeof stubInterlinearization) => void) | undefined; + const convertPromise = new Promise((resolve) => { + resolveConvert = resolve; + }); + mockConvert.mockReturnValueOnce(convertPromise); + + const { container } = await act(async () => { + const result = render(); + await Promise.resolve(); + return result; + }); + + fireEvent.click(screen.getByRole('radio', { name: /^interlinearization$/i })); + + await waitFor(() => { + const jsonPre = container.querySelector('pre'); + expect(jsonPre).toHaveTextContent('Converting...'); + }); + + await act(async () => { + if (resolveConvert) resolveConvert(stubInterlinearization); + await convertPromise; + }); + + await waitFor(() => { + expect(screen.getByText(/analysisLanguages/i)).toBeInTheDocument(); + }); + }); + it('displays parse error when parser throws non-Error (uses String(err))', async () => { mockParse.mockImplementationOnce(() => { // Intentionally throw a non-Error to test the String(err) branch in the catch block. @@ -386,26 +420,14 @@ describe('InterlinearizerWebView', () => { expect(document.activeElement).toBe(interlinearizationRadio); }); - it('does nothing when current view mode is not in JSON_VIEW_MODES (idx === -1)', async () => { + it('does nothing when current view mode is not in JSON_VIEW_MODES (idx === -1)', () => { const setJsonViewMode = jest.fn(); - let useStateCallCount = 0; - const useStateSpy = jest.spyOn(React, 'useState').mockImplementation(() => { - useStateCallCount += 1; - return useStateCallCount === 1 ? 
['invalid', setJsonViewMode] : [undefined, jest.fn()]; - }); - - try { - await renderWebView(); - const radiogroup = screen.getByRole('radiogroup', { name: /json view mode/i }); - - await act(async () => { - fireEvent.keyDown(radiogroup, { key: 'ArrowRight' }); - }); + const focusRadio = jest.fn(); + // Pass a value not in JSON_VIEW_MODES so findIndex returns -1; handler takes string for testability. + handleJsonViewModeKeyDown('invalid', 'ArrowRight', setJsonViewMode, focusRadio); - expect(setJsonViewMode).not.toHaveBeenCalled(); - } finally { - useStateSpy.mockRestore(); - } + expect(setJsonViewMode).not.toHaveBeenCalled(); + expect(focusRadio).not.toHaveBeenCalled(); }); }); }); diff --git a/src/interlinearizer.web-view.tsx b/src/interlinearizer.web-view.tsx index 6de060b..5762a73 100644 --- a/src/interlinearizer.web-view.tsx +++ b/src/interlinearizer.web-view.tsx @@ -14,7 +14,13 @@ import testXml from '../test-data/Interlinear_en_MAT.xml?raw'; type ParseResult = { data: InterlinearData; error: undefined } | { data: undefined; error: string }; /** View mode for the JSON display: raw PT9, converted model, or analyses map. */ -type JsonViewMode = 'interlinear-data' | 'interlinearization' | 'analyses'; +export type JsonViewMode = 'interlinear-data' | 'interlinearization' | 'analyses'; + +/** + * Sentinel returned by jsonToShow when interlinearization mode is selected but conversion is still + * in progress. + */ +export const JSON_SHOW_CONVERTING = Symbol('JSON_SHOW_CONVERTING'); /** Ordered list of JSON view modes for rendering and arrow-key navigation. */ const JSON_VIEW_MODES: { key: JsonViewMode; label: string }[] = [ @@ -36,6 +42,49 @@ function getViewModeLabel(mode: JsonViewMode): string { return 'Analyses (JSON):'; } +/** Renders jsonToShow for the
<pre>: "Converting..." for sentinel, stringified JSON, or empty string. */
+function formatJsonPreContent(jsonToShow: unknown): string {
+  if (jsonToShow === JSON_SHOW_CONVERTING) return 'Converting...';
+  if (jsonToShow !== undefined) return JSON.stringify(jsonToShow, undefined, 2);
+  return '';
+}
+
+/**
+ * Pure handler for arrow-key navigation on the JSON view mode radiogroup. Left/Up select previous,
+ * Right/Down select next. Exported for unit testing.
+ *
+ * @param currentMode - Current JSON view mode as string; if it is not one of
+ *   {@link JSON_VIEW_MODES}, the handler does nothing and returns false.
+ * @param eventKey - KeyboardEvent.key (e.g. 'ArrowRight', 'ArrowLeft').
+ * @param setJsonViewMode - State setter for view mode.
+ * @param focusRadio - Callback to focus the radio for a given mode (e.g.
+ *   refs.current[key]?.focus()).
+ * @returns True if the key was handled (caller should call event.preventDefault()).
+ */
+export function handleJsonViewModeKeyDown(
+  currentMode: string,
+  eventKey: string,
+  setJsonViewMode: (mode: JsonViewMode) => void,
+  focusRadio: (mode: JsonViewMode) => void,
+): boolean {
+  const idx = JSON_VIEW_MODES.findIndex((m) => m.key === currentMode);
+  if (idx === -1) return false;
+  if (eventKey === 'ArrowRight' || eventKey === 'ArrowDown') {
+    const nextKey = JSON_VIEW_MODES[(idx + 1) % JSON_VIEW_MODES.length].key;
+    setJsonViewMode(nextKey);
+    focusRadio(nextKey);
+    return true;
+  }
+  if (eventKey === 'ArrowLeft' || eventKey === 'ArrowUp') {
+    const nextKey =
+      JSON_VIEW_MODES[(idx - 1 + JSON_VIEW_MODES.length) % JSON_VIEW_MODES.length].key;
+    setJsonViewMode(nextKey);
+    focusRadio(nextKey);
+    return true;
+  }
+  return false;
+}
+
 /**
  * Main interlinearizer WebView. Parses the bundled test XML into the interlinear model and displays
  * the result as raw JSON. No PAPI commands or file loading—everything is self-contained.
@@ -55,24 +104,14 @@ globalThis.webViewComponent = function InterlinearizerWebView() {
     analyses: undefined,
   });
 
-  /**
-   * Handles arrow keys on the JSON view mode radiogroup: Left/Up select previous, Right/Down select
-   * next; updates selection and moves focus to the new radio.
-   */
-  const handleJsonViewModeKeyDown = (e: React.KeyboardEvent) => {
-    const idx = JSON_VIEW_MODES.findIndex((m) => m.key === jsonViewMode);
-    if (idx === -1) return;
-    let nextKey: JsonViewMode | undefined;
-    if (e.key === 'ArrowRight' || e.key === 'ArrowDown') {
+  /** Wires arrow-key events to the pure handler and prevents default when handled. */
+  const onJsonViewModeKeyDown = (e: React.KeyboardEvent) => {
+    if (
+      handleJsonViewModeKeyDown(jsonViewMode, e.key, setJsonViewMode, (key) =>
+        radioRefs.current[key]?.focus(),
+      )
+    ) {
       e.preventDefault();
-      nextKey = JSON_VIEW_MODES[(idx + 1) % JSON_VIEW_MODES.length].key;
-      setJsonViewMode(nextKey);
-      radioRefs.current[nextKey]?.focus();
-    } else if (e.key === 'ArrowLeft' || e.key === 'ArrowUp') {
-      e.preventDefault();
-      nextKey = JSON_VIEW_MODES[(idx - 1 + JSON_VIEW_MODES.length) % JSON_VIEW_MODES.length].key;
-      setJsonViewMode(nextKey);
-      radioRefs.current[nextKey]?.focus();
     }
   };
 
@@ -87,20 +126,33 @@ globalThis.webViewComponent = function InterlinearizerWebView() {
   }, []);
 
   const [interlinearization, setInterlinearization] = useState<Interlinearization | undefined>();
+  /**
+   * True once the convert promise has resolved or rejected; used to show "Converting..." only while
+   * in flight.
+   */
+  const [conversionSettled, setConversionSettled] = useState(false);
 
   useEffect(() => {
     if (!parsed) {
       setInterlinearization(undefined);
+      setConversionSettled(false);
       return;
     }
+    setConversionSettled(false);
     let cancelled = false;
     convertParatext9ToInterlinearization(parsed)
       .then((result) => {
-        if (!cancelled) setInterlinearization(result);
+        if (!cancelled) {
+          setInterlinearization(result);
+          setConversionSettled(true);
+        }
         return result;
       })
       .catch(() => {
-        if (!cancelled) setInterlinearization(undefined);
+        if (!cancelled) {
+          setInterlinearization(undefined);
+          setConversionSettled(true);
+        }
       });
     return () => {
       cancelled = true;
@@ -110,13 +162,19 @@ globalThis.webViewComponent = function InterlinearizerWebView() {
   /** Analyses map derived from parsed data (ID → Analysis); only defined when parsed exists. */
   const analysesMap = useMemo(() => (parsed ? createAnalyses(parsed) : undefined), [parsed]);
 
-  /** Data to show as JSON: depends on selected view mode. */
-  const jsonToShow = useMemo(() => {
-    if (jsonViewMode === 'interlinearization') return interlinearization;
+  /**
+   * Data to show as JSON: depends on selected view mode. Shows converting sentinel when in
+   * interlinearization mode and conversion has not yet settled (promise still in flight).
+   */
+  const jsonToShow = useMemo((): unknown => {
+    if (jsonViewMode === 'interlinearization') {
+      if (interlinearization === undefined && !conversionSettled) return JSON_SHOW_CONVERTING;
+      return interlinearization;
+    }
     if (jsonViewMode === 'analyses')
       return analysesMap ? Object.fromEntries(analysesMap) : undefined;
     return parsed;
-  }, [jsonViewMode, parsed, interlinearization, analysesMap]);
+  }, [jsonViewMode, parsed, interlinearization, conversionSettled, analysesMap]);
 
   return (
     
@@ -143,7 +201,7 @@ globalThis.webViewComponent = function InterlinearizerWebView() { role="radiogroup" aria-label="JSON view mode" tabIndex={-1} - onKeyDown={handleJsonViewModeKeyDown} + onKeyDown={onJsonViewModeKeyDown} > {JSON_VIEW_MODES.map(({ key, label }) => (