refactor(tests): use omniread public API instead of internal module imports
- Replace deep imports with top-level omniread exports in tests
- Ensure tests validate only the supported public API surface
- Align HTML and PDF tests with documented library usage
This commit is contained in:
@@ -4,10 +4,17 @@ import httpx
|
|||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
from jinja2 import Environment, BaseLoader
|
from jinja2 import Environment, BaseLoader
|
||||||
|
|
||||||
from omniread.core.content import ContentType
|
from omniread import (
|
||||||
from omniread.html.scraper import HTMLScraper
|
# core
|
||||||
from omniread.pdf.client import FileSystemPDFClient
|
ContentType,
|
||||||
from omniread.pdf.scraper import PDFScraper
|
|
||||||
|
# html
|
||||||
|
HTMLScraper,
|
||||||
|
|
||||||
|
# pdf
|
||||||
|
FileSystemPDFClient,
|
||||||
|
PDFScraper,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
MOCK_HTML_DIR = Path(__file__).parent / "mocks" / "html"
|
MOCK_HTML_DIR = Path(__file__).parent / "mocks" / "html"
|
||||||
|
|||||||
@@ -3,8 +3,13 @@ from typing import Optional
|
|||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
from bs4 import Tag
|
from bs4 import Tag
|
||||||
|
|
||||||
from omniread.html.parser import HTMLParser
|
from omniread import (
|
||||||
from omniread.core.content import Content
|
# core
|
||||||
|
Content,
|
||||||
|
|
||||||
|
# html
|
||||||
|
HTMLParser,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class ParsedSimpleHTML(BaseModel):
|
class ParsedSimpleHTML(BaseModel):
|
||||||
|
|||||||
@@ -2,8 +2,13 @@ from typing import Optional
|
|||||||
|
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
|
||||||
from omniread.html.parser import HTMLParser
|
from omniread import (
|
||||||
from omniread.core.content import Content
|
# core
|
||||||
|
Content,
|
||||||
|
|
||||||
|
# html
|
||||||
|
HTMLParser,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
class ParsedTableHTML(BaseModel):
|
class ParsedTableHTML(BaseModel):
|
||||||
|
|||||||
@@ -1,9 +1,13 @@
|
|||||||
from typing import Literal
|
from typing import Literal
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
|
|
||||||
from omniread.pdf import PDFParser
|
from omniread import (
|
||||||
from omniread.core.content import Content
|
# core
|
||||||
|
Content,
|
||||||
|
|
||||||
|
# pdf
|
||||||
|
PDFParser,
|
||||||
|
)
|
||||||
|
|
||||||
class ParsedPDF(BaseModel):
|
class ParsedPDF(BaseModel):
|
||||||
size_bytes: int
|
size_bytes: int
|
||||||
|
|||||||
Reference in New Issue
Block a user