-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig_xml.json
75 lines (75 loc) · 2.63 KB
/
config_xml.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
{
"llm_model": "gemini-2.0-flash-exp",
"entire_document_models": ["gemini-1.5-flash", "gemini-1.5-pro", "gemini-2.0-flash-exp", "gpt-4o", "gpt-4o-mini"],
"process_entire_document": true,
"prompt_dir": "prompts/prompt_templates",
"prompt_save_dir": "prompts/prompt_evals",
"response_file": "LLMs_responses.json",
"process_DAS_links_separately": false,
"save_xml_output": false,
"save_dynamic_prompts": true,
"html_xml_dir": "html_xml_samples/",
"repos": {
"bigd.big.ac.cn": {
"repo_name": "BIGD",
"url_concat_string": "/browse/__ID__",
"download_root": "https://download.cncb.ac.cn/gsa/__ID__"
},
"massive.ucsd.edu": {
"repo_name": "MassIVE",
"url_concat_string": "/ProteoSAFe/dataset.jsp?accession=__ID__",
"download_root": "ftp://massive.ucsd.edu/v06/__ID__/"
},
"www.ebi.ac.uk": {
"repo_name": "PRIDE",
"url_concat_string": "/pride/archive/projects/__ID__",
"download_root": "https://ftp.pride.ebi.ac.uk/pride/data/archive/2024/07/__ID__/"
},
"www.iprox.cn": {
"repo_name": "iProX",
"url_concat_string": "/page/project.html?id=__ID__",
"download_root": ""
},
"proteomecentral.proteomexchange.org": {
"repo_name": "ProteomeCentral",
"url_concat_string": "/cgi/GetDataset?ID=__ID__",
"download_root": ""
},
"www.proteomexchange.org": {
"repo_name": "ProteomeXchange",
"url_concat_string": "/cgi/GetDataset?ID=__ID__",
"repo_mapping" : "proteomecentral.proteomexchange.org",
"download_root": ""
},
"pdc.cancer.gov": {
"repo_name": "Proteomic Data Commons",
"url_concat_string": "/pdc/study/__ID__"
},
"doi.org": {
"dataset_webpage_url_ptr": "https\\:\\/\\/doi\\.org\\/\\d+\\.\\d+\\/pdb([\\w\\d]+)\\/pdb"
},
"www.ncbi.nlm.nih.gov": {
"dataset_webpage_url_ptr": "https\\:\\/\\/www\\.ncbi\\.nlm\\.nih\\.gov\\/geo\\/query\\/acc\\.cgi\\?acc=__ID__"
}
},
"data_availability_sections": [
".//sec[@sec-type='data-availability']",
".//notes[@notes-type='data-availability']"
],
"supplementary_material_sections": [
".//sec[@sec-type='supplementary-material']",
".//supplementary-material"
],
"supplementary_data_sections": [
".//sec[@sec-type='supplementary-material']",
".//supplementary-material",
".//sec[@sec-type='associated-data']",
".//sec[@sec-type='extended-data']",
".//sec[@sec-type='samples-and-clinical-data']",
".//sec[@sec-type='footnotes']"
],
"key_resources_table": [
"//sec[.//title[contains(text(), \"Key resources table\")]]//table-wrap"
]
}