yzhang@u.duke.nus.edu committed on
Commit
f652da3
·
1 Parent(s): e1aee79

Add sequence-to-SMILES feature

Browse files
Files changed (1) hide show
  1. app.py +29 -0
app.py CHANGED
@@ -108,6 +108,35 @@ class PeptideAnalyzer:
108
  self.clean_smiles_lookup = {}
109
  self.uaa_internal_exact = {}
110
  self.uaa_internal_patterns = []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
 
112
  for uaa_name, uaa_data in all_aminos.items():
113
  code = uaa_data["Code"]
 
108
  self.clean_smiles_lookup = {}
109
  self.uaa_internal_exact = {}
110
  self.uaa_internal_patterns = []
111
+ for uaa_name, uaa_data in specific_aminos.items():
112
+ code = uaa_data["Code"]
113
+ smiles = uaa_data.get("SMILES", "")
114
+ nterm = uaa_data.get("nterm", "")
115
+ cterm = uaa_data.get("cterm", "")
116
+ letter = uaa_data.get("Letter")
117
+
118
+ # keep existing full-aa lookups
119
+ if smiles:
120
+ self.exact_smiles_lookup[smiles] = code
121
+ clean = self._remove_stereochemistry(smiles)
122
+ self.clean_smiles_lookup.setdefault(clean, []).append(code)
123
+
124
+ internal = ""
125
+ if cterm:
126
+ internal = _internal_from_cterm(cterm)
127
+ elif nterm:
128
+ internal = _internal_from_nterm(nterm)
129
+
130
+ if internal:
131
+ self.exact_smiles_lookup[internal] = code
132
+ clean_int = self._remove_stereochemistry(internal)
133
+ self.clean_smiles_lookup.setdefault(clean_int, []).append(code)
134
+
135
+ self.uaa_internal_exact[code] = internal
136
+ self.uaa_internal_patterns.append((_chirality_agnostic_regex(internal), code))
137
+
138
+ if letter:
139
+ self.three_to_one[code] = letter
140
 
141
  for uaa_name, uaa_data in all_aminos.items():
142
  code = uaa_data["Code"]