# bioentities-preprocess/main.py
#
# 30 lines
# 924 B
# Python
# Raw Permalink Normal View History

# 2023-09-20 15:16:12 +02:00
from pdb.pdb_download import PDBDownloader
from pdb.pdb_metadata_extractor import MetadataExctractor
from pdb.pdb_validator import validate
# 2023-09-21 15:08:48 +02:00
from uniprot.download import UniprotSwissDownloader
from uniprot.metadata import MetadataExctractor as ME
from uniprot.uniprot_validator import validate as validate_uniprot
# 2023-09-20 15:16:12 +02:00
def _print_validation_report(result):
    """Print the outcome of one validation run.

    Args:
        result: The 4-item value returned by a ``validate`` function,
            unpacked as ``(error, valid, total, error_record)``.
            ``error`` is printed as-is; ``valid`` and ``error_record`` are
            each shown as a fraction of ``total``.
    """
    error, valid, total, error_record = result
    print(error)
    print(f"Valid {valid}/{total}")
    print(f"Error {error_record}/{total}")


def _preprocess_uniprot():
    """Run the UniProt stage: download, extract metadata, validate, report."""
    print("UNIPROT -PREPROCESSING")
    downloader = UniprotSwissDownloader()
    downloader.download()
    # ``ME`` is the UniProt metadata extractor, imported under an alias so it
    # does not clash with the PDB class of the same name.
    extractor = ME()
    extractor.extract_metadata()
    _print_validation_report(validate_uniprot())


def _preprocess_pdb():
    """Run the PDB stage: fetch files, extract metadata, validate, report."""
    print("PDB -PREPROCESSING")
    downloader = PDBDownloader()
    # NOTE(review): max_item=4 presumably caps how many entries are fetched
    # (looks like a development limit) -- confirm against PDBDownloader.
    downloader.get_file_to_downloads(max_item=4)
    extractor = MetadataExctractor()
    extractor.extract_metadata()
    _print_validation_report(validate())


def main():
    """Run the UniProt stage first, then the PDB stage."""
    _preprocess_uniprot()
    _preprocess_pdb()


if __name__ == '__main__':
    main()
# 2023-09-21 15:08:48 +02:00