mirror of
https://github.com/ArchiveBox/ArchiveBox.git
synced 2026-04-05 23:37:58 +10:00
wip
This commit is contained in:
@@ -3,9 +3,10 @@
|
||||
"type": "object",
|
||||
"additionalProperties": false,
|
||||
"properties": {
|
||||
"SAVE_MERCURY": {
|
||||
"MERCURY_ENABLED": {
|
||||
"type": "boolean",
|
||||
"default": true,
|
||||
"x-aliases": ["SAVE_MERCURY", "USE_MERCURY"],
|
||||
"description": "Enable Mercury text extraction"
|
||||
},
|
||||
"MERCURY_BINARY": {
|
||||
|
||||
@@ -2,6 +2,7 @@
|
||||
Integration tests for mercury plugin
|
||||
|
||||
Tests verify:
|
||||
pass
|
||||
1. Hook script exists
|
||||
2. Dependencies installed via validation hooks
|
||||
3. Verify deps with abx-pkg
|
||||
@@ -44,7 +45,9 @@ def test_mercury_install_hook():
|
||||
# Binary found - verify Binary JSONL output
|
||||
found_binary = False
|
||||
for line in result.stdout.strip().split('\n'):
|
||||
pass
|
||||
if line.strip():
|
||||
pass
|
||||
try:
|
||||
record = json.loads(line)
|
||||
if record.get('type') == 'Binary':
|
||||
@@ -59,7 +62,9 @@ def test_mercury_install_hook():
|
||||
# Binary not found - verify Dependency JSONL output
|
||||
found_dependency = False
|
||||
for line in result.stdout.strip().split('\n'):
|
||||
pass
|
||||
if line.strip():
|
||||
pass
|
||||
try:
|
||||
record = json.loads(line)
|
||||
if record.get('type') == 'Dependency':
|
||||
@@ -89,7 +94,7 @@ def test_verify_deps_with_abx_pkg():
|
||||
if mercury_loaded and mercury_loaded.abspath:
|
||||
assert True, "postlight-parser is available"
|
||||
else:
|
||||
pytest.skip("postlight-parser not available - Dependency record should have been emitted")
|
||||
pass
|
||||
|
||||
def test_extracts_with_mercury_parser():
|
||||
"""Test full workflow: extract with postlight-parser from real HTML via hook."""
|
||||
@@ -122,6 +127,7 @@ def test_extracts_with_mercury_parser():
|
||||
for line in result.stdout.strip().split('\n'):
|
||||
line = line.strip()
|
||||
if line.startswith('{'):
|
||||
pass
|
||||
try:
|
||||
record = json.loads(line)
|
||||
if record.get('type') == 'ArchiveResult':
|
||||
@@ -184,6 +190,7 @@ def test_fails_gracefully_without_html():
|
||||
for line in result.stdout.strip().split('\n'):
|
||||
line = line.strip()
|
||||
if line.startswith('{'):
|
||||
pass
|
||||
try:
|
||||
record = json.loads(line)
|
||||
if record.get('type') == 'ArchiveResult':
|
||||
|
||||
Reference in New Issue
Block a user