Skip to content
Snippets Groups Projects

Filling XLSX: Everything except multiple choice.

Merged Daniel Hornung requested to merge f-json-table into dev
All threads resolved!
Compare and Show latest version
4 files
+ 48
20
Compare changes
  • Side-by-side
  • Inline
Files
4
@@ -27,6 +27,7 @@ import pathlib
from collections import OrderedDict
from types import SimpleNamespace
from typing import Any, Dict, List, Optional, TextIO, Union
from warnings import warn
from jsonschema import FormatChecker, validate
from jsonschema.exceptions import ValidationError
@@ -54,11 +55,10 @@ def _get_column_types(sheet: Worksheet) -> OrderedDict:
type_row_index = _get_row_type_column_index(sheet)
for idx, col in enumerate(sheet.columns):
type_cell = col[type_row_index]
result[idx] = type_cell.value
assert (hasattr(ColumnType, type_cell.value)
or type_cell.value == RowType.COL_TYPE.name
or type_cell.value is None), (
f"Unexpected column type value: {type_cell.value}")
result[idx] = type_cell.value if type_cell.value is not None else ColumnType.IGNORE.name
assert (hasattr(ColumnType, result[idx])
or result[idx] == RowType.COL_TYPE.name), (
f"Unexpected column type value ({idx}{type_row_index}): {type_cell.value}")
return result
@@ -135,8 +135,9 @@ def _read_or_dict(data: Union[dict, str, TextIO]) -> dict:
class TemplateFiller:
"""Class to fill XLSX templates. Has an index for all relevant columns."""
def __init__(self, workbook: Workbook):
def __init__(self, workbook: Workbook, graceful: bool = False):
self._workbook = workbook
self._graceful = graceful
self._create_index()
@property
@@ -281,16 +282,17 @@ out: union[dict, None]
next_context = context.next_level(name)
# preprocessing
if isinstance(content, list):
if not content:
if not content: # empty list
continue
# Must be all of the same type.
# List elements must be all of the same type.
assert len(set(type(entry) for entry in content)) == 1
if isinstance(content[0], dict):
if isinstance(content[0], dict): # all elements are dicts
# An array of objects: must go into exploded sheet
for entry in content:
self._handle_data(data=entry, current_path=path, context=next_context)
continue
elif isinstance(content, dict):
elif isinstance(content, dict): # we recurse and simply use the result
if not current_path: # Special handling for top level
self._handle_data(content, current_path=path, context=next_context)
continue
@@ -301,26 +303,27 @@ out: union[dict, None]
insertables.update(insert)
continue
else: # scalars
content = [content]
content = [content] # make list for unified treatment below
# collecting the data
assert isinstance(content, list)
if len(content) == 1:
value = content[0]
else:
value = ";".join(content)
content = [str(x) for x in content]
value = ";".join(content) # TODO we need escaping of values
path_str = p2s(path)
assert path_str not in insertables
insertables[path_str] = value
if only_collect_insertables:
return insertables
if not current_path:
if not current_path: # Top level returns, because there are only sheets for the children.
return None
# actual data insertion
insert_row = None
sheet = None
for path_str, value in insertables.items():
if self._graceful and path_str not in self._sheet_index:
warn(f"Ignoring path with missing sheet index: {path_str}")
continue
sheet_meta = self._sheet_index[path_str]
if sheet is None:
sheet = sheet_meta.sheet
@@ -362,7 +365,8 @@ result: str
Path for the result XLSX.
validation_schema: dict, optional
If given, validate the data against this schema first. This raises an exception if the validation
fails.
fails. If no validation schema is given, try to ignore more errors in the data when filling the
XLSX template.
"""
data = _read_or_dict(data)
assert isinstance(data, dict)
@@ -375,10 +379,12 @@ validation_schema: dict, optional
except ValidationError as ve:
print(ve.message)
raise RuntimeError("Validation failed")
else:
print("No validation schema given, continue at your own risk.")
# Filling the data
result_wb = load_workbook(template)
template_filler = TemplateFiller(result_wb)
template_filler = TemplateFiller(result_wb, graceful=(validation_schema is None))
template_filler.fill_data(data=data)
parentpath = pathlib.Path(result).parent
Loading