# Top-level settings for the data-generation run.
[generation]
# Number of entities to produce.
# NOTE(review): presumably the total across all classes — confirm with the generator.
entity_count = 5000
# NOTE(review): presumably a fixed RNG seed so runs are reproducible — confirm.
seed = 98765
# NOTE(review): "Weighted" presumably selects the per-class weights in
# [generation.distribution_weights] — confirm.
entity_distribution = "Weighted"
cardinality_strategy = "Random"
# Per-class weights keyed by class IRI; the three values below sum to 1.0.
# Keys are quoted because IRIs contain characters outside TOML's bare-key set.
# NOTE(review): presumably only consulted when entity_distribution = "Weighted" — confirm.
[generation.distribution_weights]
"http://example.org/Person" = 0.5
"http://example.org/Organization" = 0.3
"http://example.org/Course" = 0.2
# Default field-generator settings.
# NOTE(review): presumably used when no datatype- or property-specific entry
# below matches a field — confirm precedence with the generator.
[field_generators.default]
locale = "en"
quality = "High"
# Generator for fields typed with the XML Schema integer datatype.
[field_generators.datatypes."http://www.w3.org/2001/XMLSchema#integer"]
generator = "integer"
# Value bounds for generated integers.
# NOTE(review): whether min/max are inclusive is not stated here — confirm.
parameters = { min = 1, max = 10_000 }
# Generator for fields typed with the XML Schema decimal datatype.
[field_generators.datatypes."http://www.w3.org/2001/XMLSchema#decimal"]
generator = "decimal"
# Value bounds for generated decimals.
# NOTE(review): precision presumably means digits after the decimal point — confirm.
parameters = { min = 0.0, max = 1000.0, precision = 2 }
# Generator for fields typed with the XML Schema date datatype.
[field_generators.datatypes."http://www.w3.org/2001/XMLSchema#date"]
generator = "date"
# Year range for generated dates.
# NOTE(review): whether end_year is inclusive is not stated here — confirm.
parameters = { start_year = 1980, end_year = 2024 }
# Generator for fields typed with the XML Schema string datatype.
[field_generators.datatypes."http://www.w3.org/2001/XMLSchema#string"]
generator = "string"
# Empty inline table: no generator parameters are set for this datatype.
parameters = {}
# Property-level entry for http://example.org/name: string generator, no parameters.
[field_generators.properties."http://example.org/name"]
generator = "string"
parameters = {}
# Property-level entry for http://schema.org/name: string generator, no parameters.
[field_generators.properties."http://schema.org/name"]
generator = "string"
parameters = {}
# Property-level entry for http://schema.org/email.
# NOTE(review): generator is "string" while the parameters carry `templates` —
# confirm the string generator actually honors templates.
[field_generators.properties."http://schema.org/email"]
generator = "string"

# Candidate address patterns. TOML performs no interpolation, so the
# {placeholder} tokens are plain text here and must be expanded by the consumer.
[field_generators.properties."http://schema.org/email".parameters]
templates = [
    "{firstName}.{lastName}@{domain}",
    "{firstName}{lastName}{number}@{domain}",
    "info@{domain}",
    "contact@{domain}",
]
# Property-level entry for http://example.org/legalName: string generator, no parameters.
[field_generators.properties."http://example.org/legalName"]
generator = "string"
parameters = {}
# Property-level entry for http://example.org/address: string generator, no parameters.
[field_generators.properties."http://example.org/address"]
generator = "string"
parameters = {}
# Property-level entry for http://example.org/phone: string generator, no parameters.
[field_generators.properties."http://example.org/phone"]
generator = "string"
parameters = {}
# Where and how the generated dataset is written.
[output]
# The ".ttl.gz" suffix lines up with format = "Turtle" and compress = true below.
path = "large_dataset.ttl.gz"
format = "Turtle"
compress = true
write_stats = true
# NOTE(review): only a single path is given while parallel_file_count = 8 —
# confirm how the writer derives per-file names when parallel_writing is on.
parallel_writing = true
parallel_file_count = 8
# Parallel execution settings.
[parallel]
# Same value (8) as parallel_file_count in [output].
worker_threads = 8
# NOTE(review): unit is presumably entities per batch — confirm.
batch_size = 250
parallel_shapes = true
parallel_fields = true