marrink-lab · csbrasnett · Nov 4, 2024 · Nov 4, 2024 · Nov 4, 2024 · Nov 4, 2024
diff --git a/bin/martinize2 b/bin/martinize2
@@ -78,6 +78,9 @@ LOGGER = StyleAdapter(LOGGER)
 
 VERSION = "martinize with vermouth {}".format(vermouth.__version__)
 
+SS_CG = {'1': 'H', '2': 'H', '3': 'H', 'H': 'H', 'G': 'H', 'I': 'H',  # lookup table: these six codes all collapse to 'H'
+         'B': 'E', 'E': 'E', 'T': 'T', 'S': 'S', 'C': 'C'}  # 'B' and 'E' -> 'E'; 'T', 'S', 'C' map to themselves
+
 
 def read_system(path, ignore_resnames=(), ignh=None, modelidx=None):
     """
@@ -952,16 +955,6 @@ def entry():
                            'for this force field',
                            type="missing-feature")
 
-    ss_sequence = list(
-        itertools.chain(
-            *(
-                dssp.sequence_from_residues(molecule, "secstruct")
-                for molecule in system.molecules
-                if selectors.is_protein(molecule)
-            )
-        )
-    )
-
     if args.cystein_bridge == "none":
         vermouth.RemoveCysteinBridgeEdges().run_system(system)
     elif args.cystein_bridge != "auto":
@@ -977,6 +970,17 @@ def entry():
         disordered_regions=args.water_idrs
     )
 
+    ss_sequence = list(
+        itertools.chain(
+            *(
+                SS_CG[i]
+                for i in dssp.sequence_from_residues(molecule, "cgsecstruct")
+                for molecule in system.molecules
+                if selectors.is_protein(molecule) if i is not None
+            )
+        )
+    )
-    ss_sequence = list(
-        itertools.chain(
-            *(
-                SS_CG[i]
-                for i in dssp.sequence_from_residues(molecule, "cgsecstruct")
-                for molecule in system.molecules
-                if selectors.is_protein(molecule) if i is not None
-            )
-        )
-    )
+    ss_sequence = list(
+        itertools.chain(
+            *(
+                dssp.convert_dssp_to_martini(dssp.sequence_from_residues(molecule, "cgsecstruct"))
+                for molecule in system.molecules
+                if selectors.is_protein(molecule) if i is not None
+            )
+        )
+    )
-    ss_sequence = list(
-        itertools.chain(
-            *(
-                SS_CG[i]
-                for i in dssp.sequence_from_residues(molecule, "cgsecstruct")
-                for molecule in system.molecules
-                if selectors.is_protein(molecule) if i is not None
-            )
-        )
-    )
+    ss_sequence = list(
+        itertools.chain(
+            *(
+                dssp.convert_dssp_to_martini(dssp.sequence_from_residues(molecule, "cgsecstruct"))
+                for molecule in system.molecules
+                if selectors.is_protein(molecule) if i is not None
+            )
+        )
+    )
+
     # Apply position restraints if required.
     if args.posres != "none":
         LOGGER.info("Applying position restraints.", type="step")
@@ -1004,6 +1008,12 @@ def entry():
         defines = ("GO_VIRT",)
         itp_paths = {"atomtypes": "go_atomtypes.itp",
                      "nonbond_params": "go_nbparams.itp"}
+        if not args.water_bias:
+            # this ensures that disordered-folded go bonds get removed regardless of force field.
+            vermouth.processors.ComputeWaterBias(args.water_bias,
+                                                 {s: float(eps) for s, eps in args.water_bias_eps},
+                                                 [(int(start), int(stop)) for start, stop in args.water_idrs],
+                                                ).run_system(system)
     else:
         # don't write non-bonded interactions
         itp_paths = []