Source code for skinfer.schema_inferer

from __future__ import absolute_import, print_function

import json
import gzip
from skinfer.draft4_generator import JsonSchemaGenerator
from skinfer.json_schema_merger import merge_schema


[docs]def gzopen(filename): if '.gz' in filename: return gzip.GzipFile(filename) return open(filename)
[docs]def load_samples_from_jsonlines(file_list): for filename in file_list: with gzopen(filename) as f: for line in f: yield json.loads(line)
[docs]def load_samples_from_json(file_list): for filename in file_list: with gzopen(filename) as f: yield json.load(f)
[docs]def load_samples(samples, jsonlines=False): if jsonlines: return load_samples_from_jsonlines(samples) return load_samples_from_json(samples)
[docs]def generate_schema_for_sample(sample): """Returns a schema generated for the given sample. """ return JsonSchemaGenerator(sample).generate()
[docs]def generate_and_merge_schemas(samples): """Iterates through the given samples, generating schemas and merging them, returning the resulting merged schema. """ merged = generate_schema_for_sample(next(iter(samples))) for sample in samples: merged = merge_schema(merged, generate_schema_for_sample(sample)) return merged