|
1 | 1 | """Configuration for a cell lexical index.""" |
2 | 2 |
|
3 | 3 | import semra |
| 4 | +import semra.landscape.cell |
4 | 5 |
|
5 | 6 | import biolexica |
6 | 7 |
|
7 | 8 | __all__ = ["CELL_CONFIGURATION"] |
8 | 9 |
|
9 | | - |
10 | | -PRIORITY = [ |
11 | | - "cl", |
12 | | - "cellosaurus", |
13 | | - "bto", |
14 | | - "clo", |
15 | | - "efo", |
16 | | - "mesh", |
17 | | - "ccle", |
18 | | - "depmap", |
19 | | -] |
20 | | - |
21 | | - |
22 | | -SEMRA_CONFIG = semra.Configuration( |
23 | | - name="Cell and Cell Line Mappings", |
24 | | - description="Originally a reproduction of the EFO/Cellosaurus/DepMap/CCLE scenario " |
25 | | - "posed in the Biomappings paper, this configuration imports several different cell and " |
26 | | - "cell line resources and identifies mappings between them.", |
27 | | - inputs=[ |
28 | | - semra.Input(source="biomappings"), |
29 | | - semra.Input(source="gilda"), |
30 | | - semra.Input(prefix="cellosaurus", source="pyobo", confidence=0.99), |
31 | | - semra.Input(prefix="bto", source="bioontologies", confidence=0.99), |
32 | | - semra.Input(prefix="cl", source="bioontologies", confidence=0.99), |
33 | | - semra.Input(prefix="clo", source="custom", confidence=0.99), |
34 | | - semra.Input(prefix="efo", source="pyobo", confidence=0.99), |
35 | | - semra.Input( |
36 | | - prefix="depmap", |
37 | | - source="pyobo", |
38 | | - confidence=0.99, |
39 | | - extras={"version": "22Q4", "standardize": True, "license": "CC-BY-4.0"}, |
40 | | - ), |
41 | | - semra.Input( |
42 | | - prefix="ccle", |
43 | | - source="pyobo", |
44 | | - confidence=0.99, |
45 | | - extras={"version": "2019"}, |
46 | | - ), |
47 | | - semra.Input(prefix="ncit", source="pyobo", confidence=0.99), |
48 | | - semra.Input(prefix="umls", source="pyobo", confidence=0.99), |
49 | | - ], |
50 | | - add_labels=False, |
51 | | - priority=PRIORITY, |
52 | | - keep_prefixes=PRIORITY, |
53 | | - remove_imprecise=False, |
54 | | - mutations=[ |
55 | | - semra.Mutation(source="efo", confidence=0.7), |
56 | | - semra.Mutation(source="bto", confidence=0.7), |
57 | | - semra.Mutation(source="cl", confidence=0.7), |
58 | | - semra.Mutation(source="clo", confidence=0.7), |
59 | | - semra.Mutation(source="depmap", confidence=0.7), |
60 | | - semra.Mutation(source="ccle", confidence=0.7), |
61 | | - semra.Mutation(source="cellosaurus", confidence=0.7), |
62 | | - semra.Mutation(source="ncit", confidence=0.7), |
63 | | - semra.Mutation(source="umls", confidence=0.7), |
64 | | - ], |
65 | | -) |
66 | | - |
67 | 10 | CELL_CONFIGURATION = biolexica.Configuration( |
68 | 11 | inputs=[ |
69 | 12 | biolexica.Input( |
|
87 | 30 | ], |
88 | 31 | ), |
89 | 32 | ], |
90 | | - mapping_configuration=SEMRA_CONFIG, |
| 33 | + mapping_configuration=semra.landscape.cell.CELL_CONFIGURATION, |
91 | 34 | ) |
0 commit comments