2022-10-31 20:01:42 +08:00
|
|
|
# Copyright 2022 Memgraph Ltd.
|
2022-10-12 22:35:47 +08:00
|
|
|
#
|
|
|
|
# Use of this software is governed by the Business Source License
|
|
|
|
# included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
|
|
|
|
# License, and you may not use this file except in compliance with the Business Source License.
|
|
|
|
#
|
|
|
|
# As of the Change Date specified in that file, in accordance with
|
|
|
|
# the Business Source License, use of this software will be governed
|
|
|
|
# by the Apache License, Version 2.0, included in the file
|
|
|
|
# licenses/APL.txt.
|
|
|
|
|
2022-11-09 22:38:51 +08:00
|
|
|
import argparse
|
2022-10-12 22:35:47 +08:00
|
|
|
import random
|
2022-11-09 22:38:51 +08:00
|
|
|
|
2022-10-12 22:35:47 +08:00
|
|
|
import helpers
|
|
|
|
|
|
|
|
# Explaination of datasets:
|
|
|
|
# - empty_only_index: contains index; contains no data
|
|
|
|
# - small: contains index; contains data (small dataset)
|
|
|
|
#
|
|
|
|
# Datamodel is as follow:
|
|
|
|
#
|
|
|
|
# ┌──────────────┐
|
|
|
|
# │ Permission │
|
|
|
|
# ┌────────────────┐ │ Schema:uuid │ ┌────────────┐
|
2022-10-18 21:47:13 +08:00
|
|
|
# │:IS_FOR_IDENTITY├────┤ Index:name ├───┤:IS_FOR_FILE│
|
2022-10-12 22:35:47 +08:00
|
|
|
# └┬───────────────┘ └──────────────┘ └────────────┤
|
|
|
|
# │ │
|
2022-10-18 21:47:13 +08:00
|
|
|
# ┌──────▼──────────────┐ ┌──▼────────────────┐
|
|
|
|
# │ Identity │ │ File │
|
|
|
|
# │ Schema:uuid │ │ Schema:uuid │
|
|
|
|
# │ Index:email │ │ Index:name │
|
|
|
|
# └─────────────────────┘ │ Index:platformId │
|
|
|
|
# └───────────────────┘
|
2022-10-12 22:35:47 +08:00
|
|
|
#
|
2022-10-18 21:47:13 +08:00
|
|
|
# - File: attributes: ["uuid", "name", "platformId"]
|
2022-10-12 22:35:47 +08:00
|
|
|
# - Permission: attributes: ["uuid", "name"]
|
|
|
|
# - Identity: attributes: ["uuid", "email"]
|
|
|
|
#
|
|
|
|
# Indexes:
|
2022-10-18 21:47:13 +08:00
|
|
|
# - File: [File(uuid), File(platformId), File(name)]
|
2022-10-12 22:35:47 +08:00
|
|
|
# - Permission: [Permission(uuid), Permission(name)]
|
|
|
|
# - Identity: [Identity(uuid), Identity(email)]
|
|
|
|
#
|
|
|
|
# Edges:
|
2022-10-18 21:47:13 +08:00
|
|
|
# - (:Permission)-[:IS_FOR_FILE]->(:File)
|
2022-10-12 22:35:47 +08:00
|
|
|
# - (:Permission)-[:IS_FOR_IDENTITYR]->(:Identity)
|
|
|
|
#
|
2022-10-18 21:47:13 +08:00
|
|
|
# AccessControl specific: uuid is the schema
|
|
|
|
|
2022-10-31 20:02:05 +08:00
|
|
|
|
|
|
|
def main():
|
2022-10-18 21:47:13 +08:00
|
|
|
parser = argparse.ArgumentParser()
|
2023-02-18 00:33:24 +08:00
|
|
|
parser.add_argument(
|
|
|
|
"--number_of_identities",
|
|
|
|
type=int,
|
|
|
|
default=10,
|
|
|
|
help="Determines how many :Identity nodes will the dataset contain.",
|
|
|
|
)
|
|
|
|
parser.add_argument(
|
|
|
|
"--number_of_files", type=int, default=10, help="Determines how many :File nodes will the dataset contain."
|
|
|
|
)
|
|
|
|
parser.add_argument(
|
|
|
|
"--percentage_of_permissions",
|
|
|
|
type=float,
|
|
|
|
default=1.0,
|
|
|
|
help="Determines approximately what percentage of the all possible identity-permission-file connections will be created.",
|
|
|
|
)
|
|
|
|
parser.add_argument("--filename", default="dataset.cypher", help="The name of the output file.")
|
2022-10-18 21:47:13 +08:00
|
|
|
|
|
|
|
args = parser.parse_args()
|
|
|
|
|
|
|
|
number_of_identities = args.number_of_identities
|
|
|
|
number_of_files = args.number_of_files
|
|
|
|
percentage_of_permissions = args.percentage_of_permissions
|
|
|
|
filename = args.filename
|
|
|
|
|
2022-10-31 17:52:06 +08:00
|
|
|
assert number_of_identities >= 0
|
|
|
|
assert number_of_files >= 0
|
2022-10-18 21:47:13 +08:00
|
|
|
assert percentage_of_permissions > 0.0 and percentage_of_permissions <= 1.0
|
|
|
|
assert filename != ""
|
|
|
|
|
2022-11-02 21:14:16 +08:00
|
|
|
with open(filename, "w") as f:
|
2022-11-02 21:18:04 +08:00
|
|
|
f.write("MATCH (n) DETACH DELETE n;\n")
|
|
|
|
|
|
|
|
# Create the indexes
|
|
|
|
f.write("CREATE INDEX ON :File;\n")
|
|
|
|
f.write("CREATE INDEX ON :Permission;\n")
|
|
|
|
f.write("CREATE INDEX ON :Identity;\n")
|
|
|
|
f.write("CREATE INDEX ON :File(platformId);\n")
|
|
|
|
f.write("CREATE INDEX ON :File(name);\n")
|
|
|
|
f.write("CREATE INDEX ON :Permission(name);\n")
|
|
|
|
f.write("CREATE INDEX ON :Identity(email);\n")
|
|
|
|
|
|
|
|
# Create extra index: in distributed, this will be the schema
|
|
|
|
f.write("CREATE INDEX ON :File(uuid);\n")
|
|
|
|
f.write("CREATE INDEX ON :Permission(uuid);\n")
|
|
|
|
f.write("CREATE INDEX ON :Identity(uuid);\n")
|
|
|
|
|
|
|
|
uuid = 1
|
|
|
|
|
|
|
|
# Create the nodes File
|
|
|
|
for index in range(0, number_of_files):
|
|
|
|
f.write(f'CREATE (:File {{uuid: {uuid}, platformId: "platform_id", name: "name_file_{uuid}"}});\n')
|
|
|
|
uuid += 1
|
|
|
|
|
|
|
|
identities = []
|
|
|
|
# Create the nodes Identity
|
|
|
|
for index in range(0, number_of_identities):
|
|
|
|
f.write(f'CREATE (:Identity {{uuid: {uuid}, name: "mail_{uuid}@something.com"}});\n')
|
|
|
|
uuid += 1
|
|
|
|
|
|
|
|
for outer_index in range(0, number_of_files):
|
|
|
|
for inner_index in range(0, number_of_identities):
|
|
|
|
file_uuid = outer_index + 1
|
|
|
|
identity_uuid = number_of_files + inner_index + 1
|
|
|
|
|
|
|
|
if random.random() <= percentage_of_permissions:
|
|
|
|
f.write(f'CREATE (:Permission {{uuid: {uuid}, name: "name_permission_{uuid}"}});\n')
|
|
|
|
f.write(
|
|
|
|
f"MATCH (permission:Permission {{uuid: {uuid}}}), (file:File {{uuid: {file_uuid}}}) CREATE (permission)-[e: IS_FOR_FILE]->(file);\n"
|
|
|
|
)
|
|
|
|
f.write(
|
|
|
|
f"MATCH (permission:Permission {{uuid: {uuid}}}), (identity:Identity {{uuid: {identity_uuid}}}) CREATE (permission)-[e: IS_FOR_IDENTITY]->(identity);\n"
|
|
|
|
)
|
|
|
|
uuid += 1
|
2022-10-31 20:02:05 +08:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
main()
|