Files
MoFin/venv/lib/python3.12/site-packages/json_repair/parse_array.py
T
知微 fa45d8aa5f fix: 小果地址统一node122(兼容LAN+EasyTier)
- health_checklist.json: 192.168.1.122→node122
- ocr_client.py: docstring IP→node122
- docs/market-data-requirements.md: IP→node122
- 所有API调用通过ProxyHandler({})绕过系统代理
  Privoxy对node122:18003返回500,直连正常
2026-06-30 02:56:35 +08:00

113 lines
4.8 KiB
Python

from typing import TYPE_CHECKING, Any, cast
from .parser_schema import ArraySchemaConfig, resolve_parser_array_schema
from .utils.constants import STRING_DELIMITERS, JSONReturnType
from .utils.json_context import ContextValues
from .utils.object_comparer import ObjectComparer
if TYPE_CHECKING:
from .json_parser import JSONParser
def _resolve_array_item_schema(
    schema_config: ArraySchemaConfig | None,
    idx: int,
) -> tuple[dict[str, Any] | bool | None, bool]:
    """Select the schema that applies to the array element at position ``idx``.

    Args:
        schema_config: Resolved array schema settings, or ``None`` when no
            schema is in effect. Only its ``items_schema`` and
            ``additional_items`` attributes are read.
        idx: Zero-based position of the element inside the array.

    Returns:
        A ``(item_schema, drop_item)`` pair. ``item_schema`` is the schema to
        apply to the element (``True`` meaning "no constraint", ``None`` when
        nothing applies). ``drop_item`` is ``True`` only when ``items_schema``
        is a list, ``idx`` is past its end, and ``additional_items`` is
        ``False``.

    Raises:
        ValueError: If the positional entry of a list ``items_schema`` is
            neither ``None``, a ``dict`` nor a ``bool``.
    """
    if schema_config is None:
        return None, False

    items = schema_config.items_schema

    # A single dict schema applies uniformly to every element.
    if isinstance(items, dict):
        return cast("dict[str, Any]", items), False

    # Anything that is neither a dict nor a list leaves elements unconstrained.
    if not isinstance(items, list):
        return True, False

    # List form: each position has its own schema entry.
    if idx < len(items):
        positional = items[idx]
        if not (positional is None or isinstance(positional, (dict, bool))):
            raise ValueError("Schema must be an object.")
        return cast("dict[str, Any] | bool | None", positional), False

    # Past the end of the positional list: ``additional_items`` decides.
    overflow = schema_config.additional_items
    if overflow is False:
        return None, True
    if isinstance(overflow, dict):
        return cast("dict[str, Any]", overflow), False
    return True, False
def parse_array(
    self: "JSONParser",
    schema: dict[str, Any] | bool | None = None,
    path: str = "$",
    closing_delimiter: str = "]",
) -> list[JSONReturnType]:
    """Parse array items from the parser's current position, tolerating damage.

    Args:
        schema: Optional schema for the array; it is resolved together with
            ``self.schema_repairer`` via ``resolve_parser_array_schema``.
        path: Prefix used to build each item's path as ``f"{path}[{idx}]"``,
            which is handed to schema-aware parsing, repair and drop logging.
        closing_delimiter: Character that terminates the array.

    Returns:
        The list of parsed items. Items the schema marks as dropped, stray
        ``...`` markers, and empty values found on an unexpected character
        are not included.

    NOTE(review): presumably the caller has already consumed the opening
    bracket before invoking this function - confirm against the call site.
    """
    # <array> ::= '[' [ <json> *(', ' <json>) ] ']' ; A sequence of JSON values separated by commas
    schema_repairer, _schema, schema_config = resolve_parser_array_schema(self.schema_repairer, schema)
    # Loop-invariant: per-item schema repair only happens with a repairer that is not in "salvage" mode.
    repair_enabled = schema_repairer is not None and schema_repairer.schema_repair_mode != "salvage"

    items: list[JSONReturnType] = []
    with self.context.enter(ContextValues.ARRAY):
        self.skip_whitespaces()
        char = self.get_char_at()
        position = 0
        # A '}' also ends the loop, not just the array's own closing delimiter.
        while char and char != closing_delimiter and char != "}":
            item_schema, drop_item = _resolve_array_item_schema(schema_config, position)
            item_path = f"{path}[{position}]"
            # Items that will be dropped are still parsed, but never schema-repaired.
            item_repairer = schema_repairer if repair_enabled and not drop_item else None

            if char not in STRING_DELIMITERS:
                # Use schema-aware parsing to guide nested repairs when configured.
                if item_repairer is None:
                    value = self.parse_json()
                else:
                    value = self.parse_json(item_schema, item_path)
            else:
                # Look past the quoted string: a string followed by ':' is often
                # a missing object start, so it is parsed as an object instead.
                quote_offset = self.skip_to_character(char, 1)
                lookahead = self.scroll_whitespaces(idx=quote_offset + 1)
                if self.get_char_at(lookahead) != ":":
                    value = self.parse_string()
                elif item_repairer is None:
                    # No schema (or dropping): still parse to keep the cursor in sync.
                    value = self.parse_object()
                else:
                    value = self.parse_object(item_schema, item_path)
                if item_repairer is not None:
                    # Enforce schema constraints/coercions on the parsed string or object.
                    value = item_repairer.repair_value(value, item_schema, item_path)

            if ObjectComparer.is_strictly_empty(value) and self.get_char_at() not in (closing_delimiter, ","):
                # Nothing usable was parsed and the cursor is not on a separator
                # or the closer: step over one character (presumably so the
                # loop cannot stall on it).
                self.index += 1
            elif value == "..." and self.get_char_at(-1) == ".":
                self.log(
                    "While parsing an array, found a stray '...'; ignoring it",
                )
            elif drop_item:
                if schema_repairer is not None:
                    # Record drops for visibility when schema forbids extra tuple items.
                    schema_repairer._log("Dropped extra array item not covered by schema", item_path)
            else:
                items.append(value)

            position += 1
            # Skip whitespace and commas between items, stopping at the closer.
            while True:
                char = self.get_char_at()
                if not char or char == closing_delimiter:
                    break
                if not (char.isspace() or char == ","):
                    break
                self.index += 1

        if char != closing_delimiter:
            self.log(
                f"While parsing an array we missed the closing {closing_delimiter}, ignoring it",
            )
        # The cursor advances one step whether or not the closer was found.
        self.index += 1
    return items