phanerozoic
/

dna-origin-classifier

@@ -19,12 +19,17 @@ def _index(kmer):
 class DnaOriginClassifier:
-    """Discriminative 8-mer classifier of DNA origin.
     A fixed featurizer counts all 65,536 8-mers and normalizes to within-sequence
     frequency; three discriminatively trained linear heads read it: a 5-class origin
     head and two binary detectors (host vs non-host, engineered vs natural). No
     alignment, no database. Requires only numpy and safetensors.
     """
     def __init__(self, path="model.safetensors"):
@@ -34,6 +39,7 @@ class DnaOriginClassifier:
         self.HW, self.Hb = t["host.weight"], t["host.bias"]
         self.EW, self.Eb = t["engineered.weight"], t["engineered.bias"]
     def features(self, seq):
         seq = "".join(c for c in seq.upper() if c in _B)
         v = np.zeros(VOCAB, dtype=np.float32)
@@ -61,8 +67,76 @@ class DnaOriginClassifier:
         """Higher means more likely engineered/synthetic (engineered vs natural head)."""
         return float(self.EW @ self.features(seq) + self.Eb[0])
 if __name__ == "__main__":
     clf = DnaOriginClassifier()
     seq = "ATGGCTAGCAAAGGAGAAGAACTTTTCACTGGAGTTGTCCCAATTCTTGTTGAATTAGATGGTGATGTT" * 5
-    print("origin:", clf.classify(seq), "host_score:", round(clf.host_score(seq), 3))

 class DnaOriginClassifier:
+    """Discriminative 8-mer classifier of DNA origin, with exact closed-form
+    interpretability and robustness because the model is linear in 8-mer counts.
     A fixed featurizer counts all 65,536 8-mers and normalizes to within-sequence
     frequency; three discriminatively trained linear heads read it: a 5-class origin
     head and two binary detectors (host vs non-host, engineered vs natural). No
     alignment, no database. Requires only numpy and safetensors.
+    Beyond classify/host_score/engineered_score, the linear form gives:
+      - attribute(seq): exact per-base contribution to a head (sums to the score minus the bias)
+      - certify(seq):   greedy count of base substitutions that flips a call (upper bound on the minimum; exact deltas)
     """
     def __init__(self, path="model.safetensors"):
         self.HW, self.Hb = t["host.weight"], t["host.bias"]
         self.EW, self.Eb = t["engineered.weight"], t["engineered.bias"]
+    # ---- core ----
     def features(self, seq):
         seq = "".join(c for c in seq.upper() if c in _B)
         v = np.zeros(VOCAB, dtype=np.float32)
         """Higher means more likely engineered/synthetic (engineered vs natural head)."""
         return float(self.EW @ self.features(seq) + self.Eb[0])
+    # ---- closed-form interpretability and robustness ----
+    def _eff(self, head):
+        """Return the weights of ``head`` divided by ``self.scale``.
+
+        ``head`` must be ``"host"`` or ``"engineered"``; any other value raises
+        ``KeyError``. ``self.scale`` is set outside this view -- presumably the
+        feature scaling applied in ``features()``; confirm against ``__init__``.
+        """
+        weights_by_head = {"host": self.HW, "engineered": self.EW}
+        return weights_by_head[head] / self.scale
+    def _bias(self, head):
+        """Return the first bias entry of ``head`` as a Python float.
+
+        ``head`` must be ``"host"`` or ``"engineered"``; any other value raises
+        ``KeyError``.
+        """
+        biases_by_head = {"host": self.Hb, "engineered": self.Eb}
+        return float(biases_by_head[head][0])
+    def attribute(self, seq, head="host"):
+        """Spread each K-mer window's effective weight evenly over its bases.
+
+        The input is upper-cased and characters not in ``_B`` are dropped, so the
+        returned array indexes the *filtered* sequence, not the raw input. Every
+        window whose ``_index`` is not ``None`` adds ``weight / n_windows / K`` to
+        each of its K positions, so the entries sum to the window-averaged weight
+        (the head score minus its bias, assuming the score is computed from the
+        same windows -- ``features()`` is not fully visible here).
+
+        Returns a float array with one entry per retained base; it is all zeros
+        when the filtered sequence is shorter than K.
+        """
+        bases = "".join(ch for ch in seq.upper() if ch in _B)
+        weights = self._eff(head)
+        n_windows = len(bases) - K + 1
+        # Clamp so sequences with no complete window never divide by zero.
+        denom = max(1, n_windows)
+        out = np.zeros(len(bases))
+        for start in range(n_windows):
+            idx = _index(bases[start:start + K])
+            if idx is not None:
+                out[start:start + K] += weights[idx] / denom / K
+        return out
+    def certify(self, seq, head="host", max_edits=80):
+        """Greedily count the base substitutions needed to flip the head's sign.
+
+        The input is upper-cased and characters not in ``_B`` are dropped. Each
+        round tries every single-base substitution (alternatives taken from
+        ``BASES``), computes its exact score change from the windows that cover
+        the edited position, and applies the one that moves the score furthest
+        towards the opposite sign. Ties keep the first candidate found.
+
+        A score of exactly zero counts as already flipped. The search stops when
+        the score has flipped, when no substitution improves it, or after
+        ``max_edits`` substitutions.
+
+        Returns the number of substitutions applied, or ``None`` if the sign was
+        not flipped. Because the search is greedy, the count is an upper bound
+        on the true minimum, not a proof of it.
+        """
+        seq = [c for c in seq.upper() if c in _B]
+        w = self._eff(head)
+        b = self._bias(head)
+        n = max(1, len(seq) - K + 1)
+
+        def window_weights(s, starts):
+            # Sum the weights of the K-mers starting at `starts`, calling
+            # _index once per window.
+            hits = (_index(s[a:a + K]) for a in starts)
+            return sum(w[j] for j in hits if j is not None)
+
+        def score(s):
+            tot = 0.0
+            for i in range(len(s) - K + 1):
+                j = _index(s[i:i + K])
+                if j is not None:
+                    tot += w[j]
+            return tot / n + b
+
+        s = "".join(seq)
+        current = score(s)
+        sign = 1 if current > 0 else -1
+        if len(seq) < K:
+            # No complete window exists, so the score is just the bias and no
+            # substitution can change it; skip the search entirely.
+            return 0 if sign * current <= 0 else None
+
+        edits = 0
+        while sign * current > 0 and edits < max_edits:
+            best_d, best = 0.0, None
+            for p in range(len(seq)):
+                # Only windows that contain position p are affected by an edit there.
+                wins = range(max(0, p - K + 1), min(p, n - 1) + 1)
+                old = window_weights(s, wins)
+                for nb in BASES:
+                    if nb == seq[p]:
+                        continue
+                    s2 = s[:p] + nb + s[p + 1:]
+                    d = (window_weights(s2, wins) - old) / n
+                    if sign * d < best_d:
+                        best_d, best = sign * d, (p, nb)
+            if best is None:
+                break
+            seq[best[0]] = best[1]
+            edits += 1
+            # Re-score once per applied edit; the loop test and the final
+            # return both reuse this value.
+            s = "".join(seq)
+            current = score(s)
+        return edits if sign * current <= 0 else None
 if __name__ == "__main__":
     clf = DnaOriginClassifier()
     seq = "ATGGCTAGCAAAGGAGAAGAACTTTTCACTGGAGTTGTCCCAATTCTTGTTGAATTAGATGGTGATGTT" * 5
+    print("origin:", clf.classify(seq), "host_score:", round(clf.host_score(seq), 3),
+          "edits_to_flip:", clf.certify(seq), "top_base_contrib:", round(float(clf.attribute(seq).max()), 4))