Coverage for biobb_io/api/memprotmd_sim_search.py: 73%

41 statements  

« prev     ^ index     » next       coverage.py v7.5.3, created at 2024-06-14 18:20 +0000

1#!/usr/bin/env python 

2 

3"""Module containing the MemProtMDSimSearch class and the command line interface.""" 

4import argparse 

5from biobb_common.generic.biobb_object import BiobbObject 

6from biobb_common.configuration import settings 

7from biobb_common.tools.file_utils import launchlogger 

8from biobb_io.api.common import check_output_path, get_memprotmd_sim_search, write_json 

9 

10 

class MemProtMDSimSearch(BiobbObject):
    """
    | biobb_io MemProtMDSimSearch
    | This class is a wrapper of the MemProtMD to perform advanced searches in the MemProtMD DB using its REST API.
    | Wrapper for the `MemProtMD DB REST API <http://memprotmd.bioch.ox.ac.uk/>`_ to perform advanced searches.

    Args:
        output_simulations (str): Path to the output JSON file. File type: output. `Sample file <https://github.com/bioexcel/biobb_io/raw/master/biobb_io/test/reference/api/output_sim_search.json>`_. Accepted formats: json (edam:format_3464).
        properties (dic - Python dictionary object containing the tool parameters, not input/output files):
            * **collection_name** (*str*) - ("refs") Name of the collection to query.
            * **keyword** (*str*) - (None) String to search for in the database metadata. Examples are families like gpcr or porin. Values: porin, outer membrane protein, membrane protein, gpcr (7-transmembrane domain receptors transducing extracellular signals into cells), ion channels, rhodopsin (The most famous GPCRs), abc, mip (Major Intrinsic Protein (MIP)/FNT superfamily: specific for the transport of water and small neutral solutes), ligand-gated (Ligand-dependent signal conversion from chemical signals to electric signals), ammonia (Regulating transepithelial ammonia secretion), mapeg (Eicosanoid and Glutathione metabolism proteins), transmembrane (Heme biosynthesis), protein, kinase (Tyrosine-protein kinases: regulate central nervous system; gene transcription and cell differentiation), glycoprotein (Expression of TCR complex), immunoglobulin (Recognition; binding and adhesion process of cells), integrin (Bridges for cell-cell and cell-extracellular matrix interaction), bnip3 (BNip3 protein family: protect cell from apoptosis), bcl-2 (Regulating cell-death; either induce apoptotic or inhibit apoptosis), atpase (ATPase regulators; P-P-bond hydrolysis-driven transporter), cytochrome (Terminal oxidase enzyme in electron transfer chain), nadp (Transmembrane proteins with NAD(P)-binding Rossmann-fold domains: monoamine oxidase; deaminates norepinephrine; epinephrine; serotonin and dopamine), a4 (Amyloid beta A4 protein; involved in alzheimer's diseases), lysosome (Lysosome-associated membrane glycoprotein: specific to lysosomes; CD107), necrosis (Tumor necrosis factor receptor: binding with TNF and NGF; interacting with a variety of signal molecules; highly associated with apoptosis), oxidoreductase (DHODH; biosynthesis of orotate), ceramidase (Neutral/alkaline ceramidase: converting sphingolipid to sphingosine), dehydrogenase (Aldehyde dehydrogenase:ALDH; Oxidation of aldehydes), mitochondrial, plastid.
            * **remove_tmp** (*bool*) - (True) [WF property] Remove temporal files.
            * **restart** (*bool*) - (False) [WF property] Do not execute if output files exist.
            * **sandbox_path** (*str*) - ("./") [WF property] Parent path to the sandbox directory.

    Examples:
        This is a use example of how to use the building block from Python::

            from biobb_io.api.memprotmd_sim_search import memprotmd_sim_search
            prop = {
                'collection_name': 'refs',
                'keyword': 'porin'
            }
            memprotmd_sim_search(output_simulations='/path/to/newSimulationSearch.json',
                                 properties=prop)

    Info:
        * wrapped_software:
            * name: MemProtMD DB
            * license: Creative Commons
        * ontology:
            * name: EDAM
            * schema: http://edamontology.org/EDAM.owl

    """

    def __init__(self, output_simulations,
                 properties=None, **kwargs) -> None:
        properties = properties or {}

        # Call parent class constructor
        super().__init__(properties)
        # Snapshot of the constructor arguments; taken before any other local
        # is created so that it only contains the call parameters.
        self.locals_var_dict = locals().copy()

        # Input/Output files
        self.io_dict = {
            "out": {"output_simulations": output_simulations}
        }

        # Properties specific for BB
        self.collection_name = properties.get('collection_name', 'refs')
        self.keyword = properties.get('keyword', None)
        self.properties = properties

        # Check the properties
        self.check_properties(properties)
        self.check_arguments()

    def check_data_params(self, out_log, err_log):
        """ Checks all the input/output paths and parameters """
        self.output_simulations = check_output_path(self.io_dict["out"]["output_simulations"], "output_simulations", False, out_log, self.__class__.__name__)

    @launchlogger
    def launch(self) -> int:
        """Execute the :class:`MemProtMDSimSearch <api.memprotmd_sim_search.MemProtMDSimSearch>` api.memprotmd_sim_search.MemProtMDSimSearch object.

        Returns:
            int: 0 when the search results were written, or when the restart
            check decided that nothing has to be executed.
        """

        # check input/output paths and parameters
        self.check_data_params(self.out_log, self.err_log)

        # Setup Biobb
        if self.check_restart():
            return 0

        # The keyword property defaults to None; normalise it only when a
        # string was actually supplied, otherwise calling .strip() on None
        # raised AttributeError before any request was made.
        # NOTE(review): a missing keyword is forwarded unchanged to
        # get_memprotmd_sim_search -- confirm the REST API accepts that.
        if isinstance(self.keyword, str):
            self.keyword = self.keyword.strip().lower()

        # get JSON object
        json_string = get_memprotmd_sim_search(self.collection_name, self.keyword, self.out_log, self.global_log)

        # write JSON file
        write_json(json_string, self.output_simulations, self.out_log, self.global_log)

        self.check_arguments(output_files_created=True, raise_exception=False)

        return 0

95 

96 

def memprotmd_sim_search(output_simulations: str, properties: dict = None, **kwargs) -> int:
    """Build a :class:`MemProtMDSimSearch <api.memprotmd_sim_search.MemProtMDSimSearch>` object and
    return the result of its :meth:`launch() <api.memprotmd_sim_search.MemProtMDSimSearch.launch>` method."""

    # Construct the building block first, then run it, so both steps are explicit.
    search_block = MemProtMDSimSearch(
        output_simulations=output_simulations,
        properties=properties,
        **kwargs,
    )
    return search_block.launch()

103 

104 

def main():
    """Command line entry point: parse the arguments, read the configuration and run the building block."""

    def wide_raw_formatter(prog):
        # Raw-text help formatter created with a very large width (99999).
        return argparse.RawTextHelpFormatter(prog, width=99999)

    cli = argparse.ArgumentParser(
        description="Wrapper for the MemProtMD DB REST API (http://memprotmd.bioch.ox.ac.uk/) to perform advanced searches.",
        formatter_class=wide_raw_formatter,
    )
    cli.add_argument(
        '-c', '--config',
        required=False,
        help="This file can be a YAML file, JSON file or JSON string",
    )

    # Arguments specific to this building block
    required_group = cli.add_argument_group('required arguments')
    required_group.add_argument(
        '-o', '--output_simulations',
        required=True,
        help="Path to the output JSON file. Accepted formats: json.",
    )

    parsed = cli.parse_args()

    # A missing or empty --config value is passed to the reader as None.
    config_source = parsed.config or None
    tool_properties = settings.ConfReader(config=config_source).get_prop_dic()

    # Run the building block with the parsed output path and properties
    memprotmd_sim_search(
        output_simulations=parsed.output_simulations,
        properties=tool_properties,
    )

121 

122 

# Run the command line interface only when this module is executed as a script.
if __name__ == "__main__":
    main()