from __future__ import absolute_import, print_function
import json
import gzip
from skinfer.draft4_generator import JsonSchemaGenerator
from skinfer.json_schema_merger import merge_schema
[docs]def gzopen(filename):
if '.gz' in filename:
return gzip.GzipFile(filename)
return open(filename)
[docs]def load_samples_from_jsonlines(file_list):
for filename in file_list:
with gzopen(filename) as f:
for line in f:
yield json.loads(line)
[docs]def load_samples_from_json(file_list):
for filename in file_list:
with gzopen(filename) as f:
yield json.load(f)
[docs]def load_samples(samples, jsonlines=False):
if jsonlines:
return load_samples_from_jsonlines(samples)
return load_samples_from_json(samples)
[docs]def generate_schema_for_sample(sample):
"""Returns a schema generated for the given sample.
"""
return JsonSchemaGenerator(sample).generate()
[docs]def generate_and_merge_schemas(samples):
"""Iterates through the given samples, generating schemas
and merging them, returning the resulting merged schema.
"""
merged = generate_schema_for_sample(next(iter(samples)))
for sample in samples:
merged = merge_schema(merged, generate_schema_for_sample(sample))
return merged