forked from TineClaeys/Eubic_Dev_hackathon_2025
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcolumn_name_to_entity.py
169 lines (168 loc) · 5.51 KB
/
column_name_to_entity.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
# Lookup table from a metadata column name (e.g. "characteristics[age]",
# "comment[instrument]") to the PascalCase entity name used for that column.
#
# Lookups are exact and case-sensitive: this is a plain dict, so callers that
# want tolerant matching must normalize the header themselves.
#
# NOTE(review): a few keys are variant spellings of another key and map to the
# same entity -- "characteristics[Individual]" (capitalized),
# "comment [cleavage agent details]" (stray space) and
# "comment[technical replcate]" (misspelled). They look like deliberate aliases
# for headers seen in real input files, so do not "correct" them without
# checking the data they were added for.
#
# Each key is listed exactly once. A repeated key in a dict literal is silently
# collapsed to a single entry, which hides copy/paste mistakes.
column_to_entity_mapping = {
    "source name": "SourceName",
    "characteristics[age]": "Age",
    "characteristics[ancestry category]": "AncestryCategory",
    "characteristics[biological replicate]": "BiologicalReplicate",
    "characteristics[cell type]": "CellType",
    "characteristics[compound]": "Compound",
    "characteristics[developmental stage]": "DevelopmentalStage",
    "characteristics[disease]": "Disease",
    "characteristics[enrichment process]": "EnrichmentProcess",
    "characteristics[individual]": "Individual",
    "characteristics[organism part]": "OrganismPart",
    "characteristics[organism]": "Organism",
    "characteristics[sex]": "Sex",
    "technology type": "TechnologyType",
    "assay name": "AssayName",
    "comment[cleavage agent details]": "CleavageAgentDetails",
    "comment[data file]": "DataFile",
    "comment[fraction identifier]": "FractionIdentifier",
    "comment[fragment mass tolerance]": "FragmentMassTolerance",
    "comment[instrument]": "Instrument",
    "comment[label]": "Label",
    "comment[modification parameters]": "ModificationParameters",
    "comment[precursor mass tolerance]": "PrecursorMassTolerance",
    "comment[technical replicate]": "TechnicalReplicate",
    "characteristics[cell line]": "CellLine",
    "material type": "MaterialType",
    "comment[fractionation method]": "FractionationMethod",
    "comment[separation]": "Separation",
    "comment[dissociation method]": "DissociationMethod",
    "comment[collision energy]": "CollisionEnergy",
    "comment[MS2 analyzer type]": "MS2AnalyzerType",
    "comment[proteomics data acquisition method]": "ProteomicsDataAcquisitionMethod",
    "characteristics[strain]": "Strain",
    "characteristics[cell part]": "CellPart",
    "characteristics[sampling time]": "SamplingTime",
    "characteristics[enrichment method]": "EnrichmentMethod",
    "characteristics[treatment]": "Treatment",
    "characteristics[region]": "Region",
    "characteristics[synthetic peptide]": "SyntheticPeptide",
    "comment[ms2 mass analyzer]": "MS2MassAnalyzer",
    "characteristics[temperature]": "Temperature",
    "characteristics[growth rate]": "GrowthRate",
    "characteristics[overproduction]": "Overproduction",
    "characteristics[spiked compound]": "SpikedCompound",
    "characteristics[timepoint]": "Timepoint",
    "characteristics[pool]": "Pool",
    "characteristics[depletion]": "Depletion",
    "characteristics[genetic modification]": "GeneticModification",
    "characteristics[pooled sample]": "PooledSample",
    "characteristics[xenograft]": "Xenograft",
    "characteristics[protocol]": "Protocol",
    "characteristics[staining]": "Staining",
    "characteristics[strain/breed]": "StrainBreed",
    "characteristics[genotype]": "Genotype",
    "comment[number of missed cleavages]": "NumberOfMissedCleavages",
    "characteristics[Anatomic Site Tumor]": "AnatomicSiteTumor",
    "characteristics[Origin Site Disease]": "OriginSiteDisease",
    "characteristics[Tumor Cellularity]": "TumorCellularity",
    "characteristics[Tumor Grade]": "TumorGrade",
    "characteristics[Tumor Stage Ovary FIGO]": "TumorStageOvaryFIGO",
    "characteristics[Individual]": "Individual",
    "characteristics[bait]": "Bait",
    "comment[depletion]": "Depletion",
    "characteristics[transfect]": "Transfect",
    "characteristics[specimen]": "Specimen",
    "comment[rice strain]": "RiceStrain",
    "characteristics[sample amount]": "SampleAmount",
    "characteristics[BMI]": "BMI",
    "characteristics[cultured cell]": "CulturedCell",
    "characteristics[tumor size]": "TumorSize",
    "characteristics[concentration of compound]": "ConcentrationOfCompound",
    "characteristics[tumor stage]": "TumorStage",
    "characteristics[Tumor site]": "TumorSite",
    "characteristics[time]": "Time",
    "characteristics[experiment]": "Experiment",
    "comment[biological replicate]": "BiologicalReplicate",
    "comment[flow rate chromatogram]": "FlowRateChromatogram",
    "comment[gradient time]": "GradientTime",
    "comment[enrichment method]": "EnrichmentMethod",
    "characteristics[technical replicate]": "TechnicalReplicate",
    "comment [cleavage agent details]": "CleavageAgentDetails",
    "comment[technical replcate]": "TechnicalReplicate",
}

# The entity names listed below are the mapping's values in insertion order
# (what `column_to_entity_mapping.values()` yields). A name appears more than
# once where several column spellings share one entity.
# SourceName
# Age
# AncestryCategory
# BiologicalReplicate
# CellType
# Compound
# DevelopmentalStage
# Disease
# EnrichmentProcess
# Individual
# OrganismPart
# Organism
# Sex
# TechnologyType
# AssayName
# CleavageAgentDetails
# DataFile
# FractionIdentifier
# FragmentMassTolerance
# Instrument
# Label
# ModificationParameters
# PrecursorMassTolerance
# TechnicalReplicate
# CellLine
# MaterialType
# FractionationMethod
# Separation
# DissociationMethod
# CollisionEnergy
# MS2AnalyzerType
# ProteomicsDataAcquisitionMethod
# Strain
# CellPart
# SamplingTime
# EnrichmentMethod
# Treatment
# Region
# SyntheticPeptide
# MS2MassAnalyzer
# Temperature
# GrowthRate
# Overproduction
# SpikedCompound
# Timepoint
# Pool
# Depletion
# GeneticModification
# PooledSample
# Xenograft
# Protocol
# Staining
# StrainBreed
# Genotype
# NumberOfMissedCleavages
# AnatomicSiteTumor
# OriginSiteDisease
# TumorCellularity
# TumorGrade
# TumorStageOvaryFIGO
# Individual
# Bait
# Depletion
# Transfect
# Specimen
# RiceStrain
# SampleAmount
# BMI
# CulturedCell
# TumorSize
# ConcentrationOfCompound
# TumorStage
# TumorSite
# Time
# Experiment
# BiologicalReplicate
# FlowRateChromatogram
# GradientTime
# EnrichmentMethod
# TechnicalReplicate
# CleavageAgentDetails
# TechnicalReplicate