Skip to content

Commit afc1936

Browse files
authored
Merge pull request #1185 from dondi/maika-database
#1120 #1164 Fix for updating data
2 parents 170670f + e939f93 commit afc1936

File tree

8 files changed

+14 -360 lines changed

8 files changed

+14 -360 lines changed

database/network-database/constants.py

+1 -12
Original file line numberDiff line numberDiff line change
@@ -13,15 +13,4 @@ class Constants:
1313
PROTEIN_DATA_FILEPATH = DATA_DIRECTORY + "/protein_data.tsv"
1414
GENE_REGULATORY_NETWORK_DATA_FILEPATH = DATA_DIRECTORY + "/gene_regulatory_network_data.tsv"
1515
PROTEIN_PROTEIN_INTERACTIONS_DATA_FILEPATH = DATA_DIRECTORY + "/protein_protein_interactions_data.tsv"
16-
SOURCE_DATA_FILEPATH = DATA_DIRECTORY + "/source_data.tsv"
17-
18-
# missing and update file paths
19-
MISSING_DATA_DIRECTORY = DATA_DIRECTORY + "/missing_data"
20-
UPDATE_DATA_DIRECTORY = DATA_DIRECTORY + "/update_data"
21-
MISSING_GRN_GENE_DATA_FILEPATH = MISSING_DATA_DIRECTORY + "/missing_grn_gene_data.tsv"
22-
UPDATE_GRN_GENE_DATA_FILEPATH = UPDATE_DATA_DIRECTORY + "/update_grn_gene_data.tsv"
23-
MISSING_PPI_GENE_DATA_FILEPATH = MISSING_DATA_DIRECTORY + "/missing_ppi_gene_data.tsv"
24-
UPDATE_PPI_GENE_DATA_FILEPATH = UPDATE_DATA_DIRECTORY + "/update_ppi_gene_data.tsv"
25-
MISSING_PROTEIN_DATA_FILEPATH = MISSING_DATA_DIRECTORY + "/missing_protein_data.tsv"
26-
UPDATE_PROTEIN_DATA_FILEPATH = UPDATE_DATA_DIRECTORY + "/update_protein_data.tsv"
27-
UPDATE_PROTEIN_NAME_DATA_FILEPATH = UPDATE_DATA_DIRECTORY + "/update_protein_name_data.tsv"
16+
SOURCE_DATA_FILEPATH = DATA_DIRECTORY + "/source_data.tsv"

database/network-database/database_services/README.md

+1 -3
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,4 @@ This folder contains all services for database operations. **Note:** This folder
44

55
## File Descriptions
66

7-
- **`filter.py`** – Retrieves data from the database and identifies new or updated records.
8-
- **`populator.py`** – Handles inserting new data into the database.
9-
- **`updater.py`** – Defines the process for updating existing records when necessary.
7+
- **`populator.py`** – Handles inserting new data into the database.

database/network-database/database_services/filter.py

-156
This file was deleted.

database/network-database/database_services/populator.py

+3 -4
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ def process_file(self, conn, cursor, data_filepath, copy_statement):
3232
"""
3333

3434
# Determine if we need to drop the last column (PPI network type)
35-
if self.network_mode == Constants.PPI_NETWORK_MODE and data_filepath == Constants.MISSING_PPI_GENE_DATA_FILEPATH:
35+
if self.network_mode == Constants.PPI_NETWORK_MODE and data_filepath == Constants.GENE_DATA_FILEPATH:
3636
print("Dropping the regulator column from the input data...")
3737
processed_rows = []
3838

@@ -72,12 +72,11 @@ class GeneDataPopulator(DataPopulator):
7272
def __init__(self, db_url, network_mode):
7373
super().__init__(db_url)
7474
self.network_mode = network_mode
75+
self.filepath = Constants.GENE_DATA_FILEPATH
7576
if network_mode == Constants.GRN_NETWORK_MODE:
7677
self.database_namespace = Constants.GRN_DATABASE_NAMESPACE
77-
self.filepath = Constants.MISSING_GRN_GENE_DATA_FILEPATH
7878
elif network_mode == Constants.PPI_NETWORK_MODE:
7979
self.database_namespace = Constants.PPI_DATABASE_NAMESPACE
80-
self.filepath = Constants.MISSING_PPI_GENE_DATA_FILEPATH
8180
else:
8281
raise ValueError(f"Unknown network type: {network_mode}")
8382

@@ -92,7 +91,7 @@ def get_copy_statement(self):
9291
class ProteinDataPopulator(DataPopulator):
9392
def __init__(self, db_url):
9493
super().__init__(db_url)
95-
self.filepath = Constants.MISSING_PROTEIN_DATA_FILEPATH
94+
self.filepath = Constants.PROTEIN_DATA_FILEPATH
9695

9796
def get_copy_statement(self):
9897
return f"COPY {Constants.PPI_DATABASE_NAMESPACE}.protein (standard_name, gene_systematic_name, length, molecular_weight, PI, taxon_id, time_stamp, source) FROM stdin WITH CSV DELIMITER E'\\t' HEADER;"

database/network-database/database_services/updater.py

-157
This file was deleted.

0 commit comments

Comments (0)