hmm.rar_HMM_HMMjavasourcecode_hmmjavacode_videovoice_视频语音

共2个文件

txt：1个

java：1个

版权申诉

视频语音

103 浏览量 2022-09-20 14:28:45 上传评论收藏 5KB RAR 举报

资源推荐

资源详情

资源评论

收起资源包目录

hmm.rar （2个子文件）

hmm.java 19KB

www.pudn.com.txt 218B

// Implementation of some algorithms for pairwise alignment from // Durbin et al: Biological Sequence Analysis, CUP 1998, chapter 3. // Peter Sestoft, [email protected] (Oct 1999), 2001-08-20 version 0.7 // Reference: http://www.dina.kvl.dk/~sestoft/bsa.html // License: Anybody can use this code for any purpose, including // teaching, research, and commercial purposes, provided proper // reference is made to its origin. Neither the author nor the Royal // Veterinary and Agricultural University, Copenhagen, Denmark, can // take any responsibility for the consequences of using this code. // Compile with: // javac Match3.java // Run with: // java Match3 // Notational conventions: // i = 1,...,L indexes x, the observed string, x_0 not a symbol // k,ell = 0,...,hmm.nstate-1 indexes hmm.state(k) a_0 is the start state import java.text.*; import java.util.*; // Some algorithms for Hidden Markov Models (Chapter 3): Viterbi, // Forward, Backward, Baum-Welch. We compute with log probabilities. class HMM { // State names and state-to-state transition probabilities int nstate; // number of states (incl initial state) String[] state; // names of the states double[][] loga; // loga[k][ell] = log(P(k -> ell)) // Emission names and emission probabilities int nesym; // number of emission symbols String esym; // the emission symbols e1,...,eL (characters) double[][] loge; // loge[k][ei] = log(P(emit ei in state k)) // Input: // state = array of state names (except initial state) // amat = matrix of transition probabilities (except initial state) // esym = string of emission names // emat = matrix of emission probabilities public HMM(String[] state, double[][] amat, String esym, double[][] emat) { if (state.length != amat.length) throw new IllegalArgumentException("HMM: state and amat disagree"); if (amat.length != emat.length) throw new IllegalArgumentException("HMM: amat and emat disagree"); for (int i=0; i<amat.length; i++) { if (state.length != amat[i].length) throw new IllegalArgumentException("HMM: amat non-square"); if (esym.length() != emat[i].length) throw new IllegalArgumentException("HMM: esym and emat disagree"); } // Set up the transition matrix nstate = state.length + 1; this.state = new String[nstate]; loga = new double[nstate][nstate]; this.state[0] = "B"; // initial state // P(start -> start) = 0 loga[0][0] = Double.NEGATIVE_INFINITY; // = log(0) // P(start -> other) = 1.0/state.length double fromstart = Math.log(1.0/state.length); for (int j=1; j<nstate; j++) loga[0][j] = fromstart; for (int i=1; i<nstate; i++) { // Reverse state names for efficient backwards concatenation this.state[i] = new StringBuffer(state[i-1]).reverse().toString(); // P(other -> start) = 0 loga[i][0] = Double.NEGATIVE_INFINITY; // = log(0) for (int j=1; j<nstate; j++) loga[i][j] = Math.log(amat[i-1][j-1]); } // Set up the emission matrix this.esym = esym; nesym = esym.length(); // Assume all esyms are uppercase letters (ASCII <= 91) loge = new double[emat.length+1][91]; for (int b=0; b<nesym; b++) { // Use the emitted character, not its number, as index into loge: char eb = esym.charAt(b); // P(emit xi in state 0) = 0 loge[0][eb] = Double.NEGATIVE_INFINITY; // = log(0) for (int k=0; k<emat.length; k++) loge[k+1][eb] = Math.log(emat[k][b]); } } public void print(Output out) { printa(out); printe(out); } public void printa(Output out) { out.println("Transition probabilities:"); for (int i=1; i<nstate; i++) { for (int j=1; j<nstate; j++) out.print(fmtlog(loga[i][j])); out.println(); } } public void printe(Output out) { out.println("Emission probabilities:"); for (int b=0; b<nesym; b++) out.print(esym.charAt(b) + hdrpad); out.println(); for (int i=1; i<loge.length; i++) { for (int b=0; b<nesym; b++) out.print(fmtlog(loge[i][esym.charAt(b)])); out.println(); } } private static DecimalFormat fmt = new DecimalFormat("0.000000 "); private static String hdrpad = " "; public static String fmtlog(double x) { if (x == Double.NEGATIVE_INFINITY) return fmt.format(0); else return fmt.format(Math.exp(x)); } // The Baum-Welch algorithm for estimating HMM parameters for a // given model topology and a family of observed sequences. // Often gets stuck at a non-global minimum; depends on initial guess. // xs is the set of training sequences // state is the set of HMM state names // esym is the set of emissible symbols public static HMM baumwelch(String[] xs, String[] state, String esym, final double threshold) { int nstate = state.length; int nseqs = xs.length; int nesym = esym.length(); Forward[] fwds = new Forward[nseqs]; Backward[] bwds = new Backward[nseqs]; double[] logP = new double[nseqs]; double[][] amat = new double[nstate][]; double[][] emat = new double[nstate][]; // Set up the inverse of b -> esym.charAt(b); assume all esyms <= 'Z' int[] esyminv = new int[91]; for (int i=0; i<esyminv.length; i++) esyminv[i] = -1; for (int b=0; b<nesym; b++) esyminv[esym.charAt(b)] = b; // Initially use random transition and emission matrices for (int k=0; k<nstate; k++) { amat[k] = randomdiscrete(nstate); emat[k] = randomdiscrete(nesym); } HMM hmm = new HMM(state, amat, esym, emat); double oldloglikelihood; // Compute Forward and Backward tables for the sequences double loglikelihood = fwdbwd(hmm, xs, fwds, bwds, logP); System.out.println("log likelihood = " + loglikelihood); // hmm.print(new SystemOut()); do { oldloglikelihood = loglikelihood; // Compute estimates for A and E double[][] A = new double[nstate][nstate]; double[][] E = new double[nstate][nesym]; for (int s=0; s<nseqs; s++) { String x = xs[s]; Forward fwd = fwds[s]; Backward bwd = bwds[s]; int L = x.length(); double P = logP[s]; // NOT exp. Fixed 2001-08-20 for (int i=0; i<L; i++) { for (int k=0; k<nstate; k++) E[k][esyminv[x.charAt(i)]] += exp(fwd.f[i+1][k+1] + bwd.b[i+1][k+1] - P); } for (int i=0; i<L-1; i++) for (int k=0; k<nstate; k++) for (int ell=0; ell<nstate; ell++) A[k][ell] += exp(fwd.f[i+1][k+1] + hmm.loga[k+1][ell+1] + hmm.loge[ell+1][x.charAt(i+1)] + bwd.b[i+2][ell+1] - P); } // Estimate new model parameters for (int k=0; k<nstate; k++) { double Aksum = 0; for (int ell=0; ell<nstate; ell++) Aksum += A[k][ell]; for (int ell=0; ell<nstate; ell++) amat[k][ell] = A[k][ell] / Aksum; double Eksum = 0; for (int b=0; b<nesym; b++) Eksum += E[k][b]; for (int b=0; b<nesym; b++) emat[k][b] = E[k][b] / Eksum; } // Create new model hmm = new HMM(state, amat, esym, emat); loglikelihood = fwdbwd(hmm, xs, fwds, bwds, logP); System.out.println("log likelihood = " + loglikelihood); // hmm.print(new SystemOut()); } while (Math.abs(oldloglikelihood - loglikelihood) > threshold); return hmm; } private static double fwdbwd(HMM hmm, String[] xs, Forward[] fwds, Backward[] bwds, double[] lo

评论收藏

内容反馈

版权申诉