diff test-data/funannotate_db/trained_species/fly/augustus/fly_weightmatrix.txt @ 0:998b719a94cb draft

"planemo upload commit 9613152729099079c7465c3d5d42005ef22ca91e"
author iuc
date Thu, 26 Aug 2021 06:56:18 +0000
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/trained_species/fly/augustus/fly_weightmatrix.txt	Thu Aug 26 06:56:18 2021 +0000
@@ -0,0 +1,23 @@
+# 
+# This file contains a matrix used for weighting the training sequences
+# when given an input sequence. Let z = (da, dc, dg, dt) be the vector
+# containing the differences in the relative nucleotide frequencies of
+# two sequences, the input sequence and a training sequence.
+# Then the training sequence has weight proportional to 
+#
+# exp ( - z M z^t)
+#
+# with M being the matrix specified below.
+# If M is nonsingular, then (apart from two normalizing factors) M
+# is the inverse of the covariance matrix of a multinormal
+# distribution - the kernel for the estimation.
+
+
+# this matrix is gc-content only, i.e. 
+# weight = 10 * exp(-200 * (dc^2 + dg^2))
+# in particular weight <= 10
+0      0      0             0
+0      200    0             0
+0      0      200           0
+0      0      0             0
+