release commit
This commit is contained in:
.bumpversion.cfg.env.example
.gitea/actions/test
.gitignore.gitmodules.pre-commit-config.yamlDockerfileLICENSEREADME.mdbiocypher
__init__.py
_config
__init__.pybiocypher_config.yamltest_config.yamltest_schema_config.yamltest_schema_config_disconnected.yamltest_schema_config_extended.yaml
_core.py_create.py_deduplicate.py_get.py_logger.py_mapping.py_metadata.py_misc.py_ontology.py_translate.pyoutput
config
docker-compose.ymlentrypoint.shfhirImport.pygraphCreation
import_fhir_to_nx_diGraph.pyimport_nx_diGraph.pyinit-scripts
mockData
pipeline.pumlpoetry.lockpyproject.tomlrequirements.txtschema_config_generation.pytestData
Alfonzo975_Medhurst46_cab042ec-9851-e5ed-80c8-0952376f5b08.jsonArmand155_Wilkinson796_4b633a8e-a312-8675-4af4-3519bfa6b00e.jsonConrad619_Zemlak964_881bcdd0-ce56-0da9-f297-696da35bd4a3.jsonDaysi106_Borer986_0096fcc6-e2d6-5aed-4790-beda6322c9be.jsonDomingo513_Durgan499_97fcce97-37ab-3fa7-d3d7-0729d60afcb5.jsonDonnell534_Koss676_5fcaaba4-cfdf-43a8-95c6-7d9f2fa6905e.jsonDorthy94_Klocko335_50390ac6-8c15-46f2-3b23-767f52a2e80c.jsonEmmie273_Reinger292_630e4b67-6e16-6bc7-6f28-2544b1a5d4d7.jsonFlorentino8_Abshire638_462cc215-c055-3e77-8e4c-9d3bf7f886f5.jsonJadwiga271_Thompson596_9973ad84-42ec-deda-23c2-906f81838e93.jsonJimmie93_Pfeffer420_b60cecd8-24c6-7983-3915-3bd6e8ede863.jsonJohnny786_Schoen8_a7a285c0-4714-dd3c-4837-8719c9b67873.jsonLala778_Jerilyn993_Cole117_ecf9d885-b712-e318-a6fa-f1ec9ffdbde8.jsonLilia791_Herrera193_8ebd900a-3563-5008-1fa9-9614ef666647.jsonLois157_Becker968_258cfb42-3e7c-be88-92fd-f31c94f3e76e.jsonMarlana402_Hansen121_8c570871-8d00-8c04-5da3-1ef43ed00f76.jsonMonte325_Prosacco716_2268a882-1b01-f71f-4377-a0dd87a78dd9.jsonMurray856_Lesch175_0759e805-61d1-ba2b-8b14-9e4308784a84.jsonNiesha86_Anderson154_2e96848a-43c1-78ea-16f2-d9d471d0f9d2.jsonPerry780_Gaylord332_c6456550-9c7a-0cf3-c18b-b266ba91ef1b.jsonPetronila724_Rutherford999_ec8f677e-0e42-d13a-b292-ff50216121b2.jsonVernetta697_Garnett735_Schaden604_d69b1a9b-e1e3-0b42-07c1-b37cae947f7f.jsonhospitalInformation1693908535569.jsonpractitionerInformation1693908535569.json
18
config/biocypher_config.yaml
Normal file
18
config/biocypher_config.yaml
Normal file
@ -0,0 +1,18 @@
|
||||
# add your settings here (overriding the defaults)
|
||||
|
||||
biocypher:
|
||||
dbms: neo4j
|
||||
offline: true
|
||||
#debug: true
|
||||
output_directory: /neo4j_import #comment if you want to debug, so that bc creates a new folder for each run in /biocypher-out
|
||||
schema_config_path: config/automated_schema.yaml
|
||||
|
||||
head_ontology:
|
||||
url: config/head_ontology/biolink-model.owl.ttl
|
||||
root_node: entity
|
||||
|
||||
neo4j:
|
||||
delimiter: '\t'
|
||||
array_delimiter: '|'
|
||||
skip_duplicate_nodes: true
|
||||
skip_bad_relationships: true
|
9088
config/head_ontology/biolink-model.owl.ttl
Normal file
9088
config/head_ontology/biolink-model.owl.ttl
Normal file
File diff suppressed because it is too large
Load Diff
283
config/manual_schema_config.yaml
Normal file
283
config/manual_schema_config.yaml
Normal file
@ -0,0 +1,283 @@
|
||||
Title: BioCypher graph schema configuration file
|
||||
|
||||
# This configuration file establishes the hierarchy and connectivity in a newly
|
||||
# set-up BioCypher property graph database. Naming should adhere to Biolink
|
||||
# nomenclature (available at https://biolink.github.io/biolink-model/ or via
|
||||
# the python module 'biolink-model-toolkit').
|
||||
|
||||
# The BioCypher YAML file specifies only the leaves of the hierarchy tree of
|
||||
# the desired graph; the hierarchical structure of entities will be derived
|
||||
# from the Biolink model + BRO model. Thus, only the immediate constituents
|
||||
# of the graph need to be specified in the schema config.
|
||||
|
||||
|
||||
# ---
|
||||
# "Named Things"
|
||||
# ---
|
||||
# The implementation of named things is fairly straightforward, since they are
|
||||
# usually represented in node form, which is also the Biolink recommendation.
|
||||
# The same is not true for associations.
|
||||
#
|
||||
# A little more complex is the representation of aggregates of named things.
|
||||
|
||||
clinicalStatus:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: clinicalStatus
|
||||
properties:
|
||||
coding_system: str
|
||||
label: str
|
||||
coding_code: str
|
||||
|
||||
Condition:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Condition
|
||||
properties:
|
||||
input_format: HL7 FHIR
|
||||
data_specification: Medical Informatics Initiative Germany Core Data Set, Basic Modules
|
||||
|
||||
diagnosis:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: diagnosis
|
||||
properties:
|
||||
type.coding_code: str
|
||||
sequence: str
|
||||
label: str
|
||||
type.coding_system: str
|
||||
|
||||
DiagnosticReport:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: DiagnosticReport
|
||||
properties:
|
||||
resourceType: str
|
||||
label: str
|
||||
status: str
|
||||
id: str
|
||||
|
||||
Encounter:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Encounter
|
||||
properties:
|
||||
resourceType: str
|
||||
label: str
|
||||
status: str
|
||||
id: str
|
||||
|
||||
identifier:
|
||||
is_a: Attribute
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: identifier
|
||||
properties:
|
||||
label: str
|
||||
value: str
|
||||
system: str
|
||||
|
||||
interpretation: #
|
||||
is_a: named thing
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: interpretation
|
||||
properties:
|
||||
extension.valueCoding_system: str
|
||||
extension_url: str
|
||||
extension.valueCoding_display: str
|
||||
coding_code: str
|
||||
coding_system: str
|
||||
label: str
|
||||
extension.valueCoding_code: str
|
||||
|
||||
maritalStatus:
|
||||
is_a: OrganismAttribute
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: maritalStatus
|
||||
properties:
|
||||
label: str
|
||||
coding_system: str
|
||||
coding_code: str
|
||||
|
||||
Observation:
|
||||
is_a: ClinicalEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Observation
|
||||
properties:
|
||||
resourceType: str
|
||||
label: str
|
||||
effectiveDateTime: str
|
||||
status: str
|
||||
id: str
|
||||
|
||||
Organization:
|
||||
is_a: AdministrativeEntity
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Organization
|
||||
properties:
|
||||
label: str
|
||||
id: str
|
||||
name: str
|
||||
resourceType: str
|
||||
|
||||
Patient:
|
||||
is_a: Human
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Patient
|
||||
properties:
|
||||
resourceType: str
|
||||
label: str
|
||||
gender: str
|
||||
id: str
|
||||
birthDate: str
|
||||
|
||||
Procedure:
|
||||
# is_a: Procedure
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: Procedure
|
||||
properties:
|
||||
label: str
|
||||
performedDateTime: str
|
||||
resourceType: str
|
||||
status: str
|
||||
id: str
|
||||
|
||||
referenceRange: #
|
||||
is_a: named thing
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: referenceRange
|
||||
properties:
|
||||
high_system: str
|
||||
high_value: str
|
||||
high_code: str
|
||||
label: str
|
||||
high_unit: str
|
||||
|
||||
search: #
|
||||
is_a: named thing
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: search
|
||||
properties:
|
||||
label: str
|
||||
mode: str
|
||||
|
||||
type:
|
||||
is_a: Attribute
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: type
|
||||
properties:
|
||||
coding_system: str
|
||||
label: str
|
||||
coding_code: str
|
||||
coding_display: str
|
||||
|
||||
verificationStatus:
|
||||
is_a: Attribute
|
||||
represented_as: node
|
||||
preferred_id: fhir_id
|
||||
label_in_input: verificationStatus
|
||||
properties:
|
||||
coding_system: str
|
||||
label: str
|
||||
coding_code: str
|
||||
coding_display: str
|
||||
|
||||
|
||||
# ---
|
||||
# Associations
|
||||
# ---
|
||||
# Associations are not supposed to be represented in node form as per the
|
||||
# specifications of Biolink. However, in an analytic context, it often makes
|
||||
# sense to represent interactions as nodes in Neo4j, because it enables, for
|
||||
# instance, the annotation of a relationship with a publication as source of
|
||||
# evidence (also known as reification in the knowledge graph world).
|
||||
|
||||
# The Biolink specifications for these types of relationships do
|
||||
# not go into depth; for example, the hierarchy for molecular interactions
|
||||
# (ie, "associations") ends at "PairwiseMolecularInteraction", there are no
|
||||
# explicit terms for protein-protein-interaction, phosphorylation, miRNA-
|
||||
# targeting, etc. Biolink proposes to use interaction identifiers from
|
||||
# ontologies, such as https://www.ebi.ac.uk/ols/ontologies/mi/.
|
||||
|
||||
# association to connect anything to an identifier node
|
||||
# if functional, includes:
|
||||
# IDENTIFIED_BY_Condition_Identifier,
|
||||
# IDENTIFIED_BY_DiagnosticReport_Identifier,
|
||||
# IDENTIFIED_BY_Encounter_Identifier,
|
||||
# IDENTIFIED_BY_Observation_Identifier,
|
||||
# IDENTIFIED_BY_Organization_Identifier
|
||||
# IDENTIFIED_BY_Patient_Identifier,
|
||||
# IDENTIFIED_BY_Procedure_Identifier
|
||||
|
||||
condition to identifier association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: IDENTIFIED_BY_Condition_Identifier
|
||||
|
||||
diagnostic report to identifier association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: IDENTIFIED_BY_DiagnosticReport_Identifier
|
||||
|
||||
observation to identifier association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: IDENTIFIED_BY_Observation_Identifier
|
||||
|
||||
observation derived from observation association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: DERIVED_FROM_Observation_Observation
|
||||
|
||||
observation has member observation association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: HAS_MEMBER_Observation_Observation
|
||||
|
||||
procedure to identifier association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: IDENTIFIED_BY_Procedure_Identifier
|
||||
|
||||
procedure to diagnostic report association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: IDENTIFIED_BY_Procedure_Identifier
|
||||
|
||||
procedure reasoned by observation association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: HAS_REASON_REFERENCE_Procedure_Observation
|
||||
|
||||
procedure performer is practitioner association:
|
||||
is_a: association
|
||||
represented_as: edge
|
||||
label_in_input: HAS_ACTOR_ProcedurePerformer_Practitioner
|
||||
|
||||
#represented_as: edge
|
||||
#label_in_input: DERIVED_FROM_Observation_Observation:
|
||||
#represented_as: edge
|
||||
#label_in_input: DERIVED_FROM_Observation_Observation
|
||||
#protein interaction:
|
||||
# is_a: Pairwise molecular interaction
|
||||
# represented_as: edge
|
||||
# label_in_input: protein_protein_interaction
|
||||
|
||||
#protein to disease association:
|
||||
# is_a: Association
|
||||
# represented_as: edge
|
||||
# label_in_input: protein_disease_association
|
Reference in New Issue
Block a user