Better error handling for 20 Å structures

Louis BECQUEY
Commit cf484aad6f77381a56a61599b8b6c1f69d06bcc9 cf484aad 1 parent c9cbadf0
Showing 1 changed file with 24 additions and 21 deletions
RNAnet.py
--- a/RNAnet.py
View file @cf484aa
+++ b/RNAnet.py
View file @cf484aa
@@ -252,14 +252,23 @@ class Chain:
         while True in df.duplicated(['nt_resnum']).values:
             i = df.duplicated(['nt_resnum']).values.tolist().index(True)
             df.iloc[i:, 1] += 1
-            
+
         # Drop ligands detected as residues by DSSR, by detecting several markers
         df = df.drop_duplicates("index_chain", keep="first") # drop doublons in index_chain
-        while (df.iloc[[-1]].nt_name.tolist()[0] not in ["A", "C", "G", "U"] and 
+        while (len(df.index_chain) and df.iloc[[-1]].nt_name.tolist()[0] not in ["A", "C", "G", "U"] and 
-              (df.iloc[[-1]][["alpha", "beta", "gamma", "delta", "epsilon", "zeta", "v0", "v1", "v2", "v3", "v4"]].isna().values).all()
+            ((df.iloc[[-1]][["alpha", "beta", "gamma", "delta", "epsilon", "zeta", "v0", "v1", "v2", "v3", "v4"]].isna().values).all()
-               or (df.iloc[[-1]].puckering=='').any()):
+            or (df.iloc[[-1]].puckering=='').any())):
             df = df.head(-1) 
+        # Assert some nucleotides exist
+        try:
+            l = df.iloc[-1,1] - df.iloc[0,1] + 1    # length of chain from nt_resnum point of view
+        except IndexError:
+            warn(f"Error while parsing DSSR's annotation: No nucleotides are part of {self.chain_label}!", error=True)
+            self.delete_me = True
+            self.error_messages = f"Error while parsing DSSR's json output: No nucleotides from {self.chain_label}. We expect a problem with {self.pdb_id} mmCIF download. Delete it and retry."
+            return 1
+
         # If, for some reason, index_chain does not start at one (e.g. 6boh, chain GB), make it start at one
         if df.iloc[0,0] != 1:
             st = df.iloc[0,0] -1
@@ -292,13 +301,6 @@ class Chain:
         # index_chain            1 |-------------|77 83|------------|  149
         # expected data point    1 |--------------------------------|  154
         #
-        try:
-            l = df.iloc[-1,1] - df.iloc[0,1] + 1    # length of chain from nt_resnum point of view
-        except IndexError:
-            warn(f"Error while parsing DSSR's annotation: No nucleotides are part of {self.chain_label}!", error=True)
-            self.delete_me = True
-            self.error_messages = f"Error while parsing DSSR's json output: No nucleotides from {self.chain_label}. We expect a problem with {self.pdb_id} mmCIF download. Delete it and retry."
-            return 1
         if l != len(df['index_chain']):         # if some residues are missing, len(df['index_chain']) < l
             resnum_start = df.iloc[0,1]
@@ -851,7 +853,7 @@ class Pipeline:
                 print("RNANet 1.0 alpha ")
                 sys.exit()
             elif opt == "-r" or opt == "--resolution":
-                assert float(arg) > 0.0 and float(arg) < 20.0 
+                assert float(arg) > 0.0 and float(arg) <= 20.0 
                 self.CRYSTAL_RES = float(arg)
             elif opt == "-s":
                 self.RUN_STATS = True
@@ -1770,14 +1772,15 @@ def work_build_chain(c, extract, khetatm, retrying=False):
         c.extract_3D_data()
     # Small check
-    with sqlite3.connect(runDir+"/results/RNANet.db", timeout=10.0) as conn:
+    if not c.delete_me:
-        nnts = sql_ask_database(conn, f"SELECT COUNT(nt_id) FROM nucleotide WHERE chain_id={c.db_chain_id};", warn_every=10)[0][0]
+        with sqlite3.connect(runDir+"/results/RNANet.db", timeout=10.0) as conn:
-    if not(nnts):
+            nnts = sql_ask_database(conn, f"SELECT COUNT(nt_id) FROM nucleotide WHERE chain_id={c.db_chain_id};", warn_every=10)[0][0]
-        warn(f"Nucleotides not inserted: {c.error_messages}")
+        if not(nnts):
-        c.delete_me = True
+            warn(f"Nucleotides not inserted: {c.error_messages}")
-        c.error_messages = "Nucleotides not inserted !"
+            c.delete_me = True
-    else:
+            c.error_messages = "Nucleotides not inserted !"
-        notify(f"Inserted {nnts} nucleotides to chain {c.chain_label}")
+        else:
+            notify(f"Inserted {nnts} nucleotides to chain {c.chain_label}")
     # extract the portion we want
     if extract and not c.delete_me:
@@ -2095,7 +2098,7 @@ if __name__ == "__main__":
     # compute an update compared to what is in the table "chain"
     #DEBUG: list everything
-    # pp.REUSE_ALL = True
+    pp.REUSE_ALL = True
     pp.list_available_mappings()
     # ===========================================================================