
    瞤dO                        d Z dZdZdZdZi ddddd	d
dddddddddddddddddddddddddddddddddddddd ddd!Zi dd"dd#d$d%d&d'dd(d)d*d+d,dd-d.d/d0d1dd2dd3d4d5d6d7dd8dd9d:d;d<d=d>d?d@dAdBd@dCdDd@dEdFZi dGdHdIdJdKg dLdMdNdOdJdPg dQdLdRdSdTdJdPg dUdLdVdSdWdJdPg dXdLdYdSdZdJdPg d[dLd\dSd]dJdPg d^dLd_dSd`dJdPg dadLdbdSdcdJdPg dadLdddSdTdJdPg dedLdfdSdTdJdPg dgdLdhdSdWdJdPg didLdjdSdkdJdPg dldLdmdSdndJdPg dodLdpdSdqdJdPg drdLdsdSdtdJdPg dudLdvdSdwdJdPg dxdLdydzd{dJdPd|d}gdLd~d{dJdPg ddLdzdWdJdKdd}gdLdzdTdJdKg ddLddTdJdKg ddLddWdJdKg ddLddWdJdKg ddLdddJdKg ddLdddJdKg ddLdSddddPd d  ee                                          D             D             dgz   dd	Z	dS )z
Parameters for running codeml
zFrancois-Jose Serrazfrancois@barrabin.orgGPLv3z0.0seqfilealgntreefiletreeoutfileoutnoisy    verbose   runmodeseqtype   	CodonFreqclockaaDistmodelNSsitesicodeMgene	fix_kappakappandataz*10ffffff?g           z1e-6)	fix_omegaomega	fix_alphaalphaMalphancatGgetSERateAncestorfix_blength
Small_Diff	cleandatamethoda&  0:1/61 each, 1:F1X4, 2:F3X4, 3:codon table. The equilibrium codon frequencies in codon substitution model. Can be assumed to be equal (1/61 each for the standard genetic code, CodonFreq = 0), calculated from the average nucleotide frequencies (CodonFreq = 1), from the average nucleotide frequencies at the three codon positions (CodonFreq = 2), or used as free parameters (CodonFreq = 3). The number of parameters involved in those models of codon frequencies is 0, 3, 9, and 60 (for the universal code), for CodonFreq = 0, 1, 2, and 3 respectively.z0:equal, +:geometric; -:linear, 1-6:G1974,Miyata,c,p,v,a 7:AAClasses. Specifies whether equal amino acid distances are assumed (= 0) or Grantham's matrix is used (= 1) (Yang et al. 1998).r   a   initial or fixed alpha, 0:infinity (constant rate). For codon models, the pair fix_alpha and alpha specify the model of gamma rates for sites, in which the relative rate for a site varies among codons according to the gamma distribution, but the omega ratio stays the same over all sites.r&   a	  1 means sites involving ambiguity characters (undetermined nucleotides such as N, ?, W, R, Y, etc. anything other than the four nucleotides) or alignment gaps are removed from all sequences. This leads to faster calculation. cleaddata = 0 (default) uses those sitesa  0:no clock, 1:clock; 2:local clock. Specifies models concerning rate constancy or variation among lineages. clock = 0 means no clock and rates are entirely free to vary from branch to branch. An unrooted tree should be used under this model. clock = 1 means the global clock, and all branches have the same rate. The option clock = 3 is for combined analysis of multiple-gene or multiple-partition data, allowing the branch rates to vary in different ways among the data partitions (Yang and Yoder 2003). Also the variable (= 5 or 6) is used to implement the ad hoc rate smoothing procedure of Yang (2004). For clock = 1 or 2, a rooted tree should be used.r   a#  0: estimate gamma shape parameter; 1: fix it at alpha. For codon models, the pair fix_alpha and alpha specify the model of gamma rates for sites, in which the relative rate for a site varies among codons according to the gamma distribution, but the omega ratio stays the same over all sites.r$   a  0: ignore, -1: random, 1: initial, 2: fixed. This tells the program what to do if the tree has branch lengths. Use 0 if you want to ignore the branch lengths. Use -1 if you want the program to start from random starting points. This might be useful if there are multiple local optima. Use 1 if you want to use the branch lengths as initial values for the ML iteration. Use 2 if you want the branch lengths to be fixed at those given in the tree file (rather than estimating them by ML).a$  1: kappa fixed, 0: kappa to be estimated. Specifies whether kappa in K80, F84, or HKY85 is given at a fixed value or is to be estimated by iteration from the data. If fix_kappa = 1, the value of another variable, kappa , is the given value, and otherwise the value of kappa is used as the initial estimate for iteration. The variables fix_kappa and kappa have no effect with JC69 or F81 which does not involve such a parameter, or with TN93 and REV which have two and five rate parameters respectively, when all of them are estimated from the data.r   z&1: omega or omega_1 fixed, 0: estimater"   z0: don't want them, 1: want S.E.s of estimates. Tells whether we want estimates of the standard errors of estimated parameters.a  specifies the genetic code. Eleven genetic code tables are implemented using icode = 0 to 10 corresponding to transl_table 1 to 11 in GenBank. These are 0 for the universal code; 1 for the mammalian mitochondrial code; 3 for mold mt., 4 for invertebrate mt.; 5 for ciliate nuclear code; 6 for echinoderm mt.; 7 for euplotid mt.; 8 for alternative yeast nuclear; 9 for ascidian mt.; and 10 for blepharisma nuclear. There is also an additional code, called Yang's regularized code, specified by icode = 11.zM0: estimate gamma shape parameter; 1: fix it at alpha. Initial or fixed kappar    zdifferent alphas for genes. Specifies whether one gamma distribution will be applied across all sites (Malpha = 0) or a different gamma distribution is used for each gene (or codon position).r'   a  0: simultaneous; 1: one branch at a time. This variable controls the iteration algorithm for estimating branch lengths under a model of no clock. method = 0 implements the old algorithm in PAML, which updates all parameters including branch lengths simultaneously. method = 1 specifies an algorithm newly implemented in PAML, which updates branch lengths one by one. method = 1 does not work under the clock models (clock = 1, 2, 3).z0:rates, 1:separate. In combination with option G in the sequence data file, specifies partition models (Yang and Swanson 2002)a  specifies the branch models (Yang 1998; Yang and Nielsen 1998). model = 0 means one omega ratio for all branches; 1 means one ratio for each branch (the free-ratio model); and 2 means an arbitrary number of ratios (such as the 2-ratios or 3-ratios models). When model = 2, you have to group branches on the tree into branch groups using the symbols # or $ in the tree. With model = 2, the variable fix_omega fixes the last omega ratio ( omega(k-1) if you have k ratios in total) at the value of omega specified in the file.r!   a  is then the number of categories for the discrete-gamma model ( baseml ). Values such as 5, 4, 8, or 10 are reasonable. Note that the discrete gamma model has one parameter (alpha), like the continuous gamma model, and the number of categories is not a parameter.z7specifies the number of separate data sets in the file.z*0,1,2,3,9: how much rubbish on the screen.ab  0:one w; 1:neutral; 2:selection; 3:discrete; 4:freqs; 5:gamma; 6:2gamma; 7:beta; 8:beta&w; 9:beta&gamma; 10:beta&gamma+1; 11:beta&normal>1; 12:0&2normal>1; 13:3normal>0. Specifies the site models, with NSsites = m corresponds to model Mm in Yang et al. (2000b). The variable ncatG is used to specify the number of categories in the omega distribution under some models. In Yang et al. (2000b), this is 3 for M3 (discrete), 5 for M4 (freq), 10 for the continuous distributions (M5: gamma, M6: 2gamma, M7: beta, M8:beta&w, M9:beta&gamma, M10: beta&gamma+1, M11:beta&normal>1, and M12:0&2normal>1, M13:3normal>0).z5initial or fixed omega, for codons or codon-based AAsa  specifies the names of the sequence data file, main result file, and the tree structure file, respectively. You should not have spaces inside a file name. In general try to avoid special characters in a file name as they might have special meanings under the OS.a|  Usually use 0. The value 1 forces the program to do two additional analyses, which you can ignore if you don't need the results. First under a model of variable rates across sites such as the gamma, RateAncestor = 1 forces the program to calculate rates for individual sites along the sequence (output in the file rates ), using the empirical Bayes procedure (Yang and Wang 1995).zg0: user tree; 1: semi-automatic; 2: automatic 3: StepwiseAddition; (4,5):PerturbationNNI; -2: pairwise.z1:codons; 2:AAs; 3:codons-->AAszis a small value used in the difference approximation of derivatives. Use a value between 1e-8 and 1e-5 and check that the results are not sensitive to the value used.z%1: detailed output, 0: concise output)r   r	   r   r   r   r#   r   r   r   r%   r   r   XXUnknownzUser definedcodemlT)typevolexec
allow_markchangesM0nullznegative-selectionF)r   r
   r   *r'   r4   r    r4   r   r4   M1site
relaxation))r   r   r3   r5   r6   r7   M2zpositive-selection)r   r   r   g333333?r3   r5   r6   r7   M3discrete)r      r   r   r!   rA   r3   r5   r6   r7   M4frequencies))r      rB   r3   r5   r6   r7   M5gamma))r      rB   r3   r5   r6   r7   M6z2 gammaM7))r      r3   r5   r6   r7   M8a)r   r   r   r   r   r   r3   r5   r6   r7   M8)rN   r=   r3   r5   r6   r7   M9zbeta and gamma))r   	   r3   r5   r6   r7   M10zbeta and gamma + 1))r   
   r3   r5   r6   r7   M11zbeta and normal > 1))r      r3   r5   r6   r7   M12z0 and 2 normal > 2))r      r3   r5   r6   r7   M13z3 normal > 0))r      r3   r5   r6   r7   fbbranchzfree-ratiosr   r   r2   branch_ancestor)r^   )r#   r   r2   r   r   )r`   r2   rO   rP   zbranch-site)r`   r<   rO   rP   r!   r4   )r`   r<   r=   ra   )r`   r@   r=   ra   zdifferent-ratios)r   rA   r<   rC   )rb   r@   rC   zpositive/negative selectionSlrz= c                 "    g | ]}|d          dfS )r
   r4    .0xs     1lib/python3.11/site-packages/ete3/evol/control.py
<listcomp>rj   6  s     iiiAQqT3Kiii    c                 &    g | ]}d |d         v|S )filer
   re   rf   s     ri   rj   rj   6  s*    1h1h1hU[cdefcgUgUg!UgUgUgrk   )positive_only0)r+   r,   r-   sepr.   r/   )	fb_ancb_freeb_neutbsA1bsAbsBbsCbsDSLRN)
__doc__
__author__	__email____licence____version__PARAMSPARAMS_DESCRIPTIONlistitemsAVAILre   rk   ri   <module>r      sF  P  $
%	
V
V
 U
 Q	

 Q
 Q
 Q
 Q
 Q
 Q
 Q
 Q
 Q
 Q
 Q
  Q!
" U#
$ ;
 
 
B  ~  T   x   a	
   h
   {   ~   | =   X   Q d   W   I   W    c!"   _#$ OA z	L ^ U~ ^6  ^<;   @E	y " E	
 	v.B #3 3 34 4E	 	vl #3 3 34 4E	* 	v.B #3 3 34 4+E	< 	vj #3 3 3	4 	4=E	P 	vm #3 3 34 4QE	b 	vg #3 3 34 4cE	t 	vi #3 3 34 4uE	F 	vl #3 3 34 4GE	V 
vl #3 3 3	4 	4WE	j 	v.B #3 3 34 4kE	| 	v.> #3 3 34 4}E	L 
v.B #3 3 34 4ME	\ 
v.C #3 3 34 4]E	l 
v.B #3 3 34 4mE	| 
vn #3 3 34 4}E	L 	xm #//12 2ME	V )] #1 1 12 2  .B "//12 2
  l "1 1 12 2 %l "3 3 34 4 %.B "3 3 34 4 %.B "3 3 34 4 %.@ "1 1 12 2 %.@ "1 1 12 2 (E#ii1h1hTT&,,..=Q=Q1h1h1hiii'()	* *E	 E	 E	rk   