# HG changeset patch
# User iracooke
# Date 1393999462 18000
# Node ID 5d3626c860719e7f38e3cf81fdd7a2ad0a3b976c
# Parent  15c2dda543b36f0ba227d7158894d4747f8b67d7
Uploaded
diff -r 15c2dda543b3 -r 5d3626c86071 README
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/README	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,7 @@
+This package is a galaxy wrapper for the MSGF+ search tool.
+
+Requirements:
+This package depends on the galaxy_protk, protk_msgfplus, protk_proteowizard packages
+Please see instructions for those packages before installing
+
+In addition to basic requirements you must also have unzip and java 6 runtime (or greater) installed
diff -r 15c2dda543b3 -r 5d3626c86071 README.md
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/README.md	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,8 @@
+## What is it?
+Galaxy tool definition file and wrapper scripts for the [MSGF+ Search Engine](http://proteomics.ucsd.edu/Software/MSGFPlus.html).
+
+## Installation
+Install from the main galaxy toolshed at http://toolshed.g2.bx.psu.edu/
+
+Depends on command-line scripts and databases available in the [protk ruby gem](https://bitbucket.org/iracooke/protk). 
+
diff -r 15c2dda543b3 -r 5d3626c86071 msgfplus_search.xml
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/msgfplus_search.xml	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,185 @@
+
+    Run an MSGF+ Search
+    
+        protk
+        msgfplus
+        proteowizard
+    
+    
+        msgfplus_search.rb
+        #if $database.source_select=="built_in":
+         --galaxy -d $database.dbkey
+        #else
+        --galaxy -d $database.fasta_file
+        #end if
+
+        --var-mods='
+        $variable_mods
+        #for $custom_variable_mod in $custom_variable_mods:
+        ,${custom_variable_mod.custom_mod}
+        #end for
+        '
+
+        --fix-mods='
+        $fixed_mods
+        #for $custom_fix_mod in $custom_fix_mods:
+        ,${custom_fix_mod.custom_mod}
+        #end for
+        '
+
+        $input_file 
+        -o $output 
+        -r 
+        --enzyme=$enzyme 
+        --precursor-ion-tol-units=$precursor_tolu 
+        -v $missed_cleavages 
+        -f $fragment_ion_tol 
+        -p $precursor_ion_tol 
+        --instrument=$instrument
+        --isotope-error-range=$isotope_error_range
+        --fragment-method=$fragment_method
+        --protocol=$protocol
+        --min-pep-len=$min_pep_len
+        --max-pep-len=$max_pep_len
+        --max-pep-charge=$max_pep_charge
+        --min-pep-charge=$min_pep_charge
+        --num-reported-matches=$num_reported_matches
+        --java-mem=$java_mem
+        #unless $pepxml_output_use:
+        --no-pepxml
+        #end if
+    
+
+    
+        
+            
+                
+                
+            
+            
+                
+                    
+                    
+                        
+                        
+                    
+                
+            
+            
+                
+            
+        
+        
+        
+            
+                
+                
+            
+        
+        
+            
+        
+        
+            
+                
+                
+            
+        
+        
+            
+            
+        
+        
+            
+            
+            
+            
+        
+        
+        
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+        
+        
+        
+            
+            
+            
+            
+        
+
+        
+            
+            
+            
+            
+            
+            
+        
+
+        
+            
+            
+            
+            
+            
+        
+
+        
+
+        
+        
+            
+            
+            
+        
+
+        
+        
+        
+        
+        
+        
+        
+        
+    
+    
+        
+            
+                
+            
+        
+    
+    
+        
+            
+              
+                  
+               
+        
+    
+    
+
+**What it does**
+
+Runs an MS/MS database search using the MSGFPlus search engine. Output is in the form of a pepXML file containing identified peptides along with their raw search scores.
+
+----
+
+**References**
+
+Please see http://proteomics.ucsd.edu/Software/MSGFPlus.html for details of the MSGFPlus search engine and references describing its algorithm
+
+    
+
diff -r 15c2dda543b3 -r 5d3626c86071 repository_dependencies.xml
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,4 @@
+
+
+    
+ 
diff -r 15c2dda543b3 -r 5d3626c86071 test-data/bsa.fasta
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/bsa.fasta	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,26 @@
+>sp|ALBU_BOVIN|
+MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFKGLVLIA
+FSQYLQQCPFDEHVKLVNELTEFAKTCVADESHAGCEKSLHTLFGDELCK
+VASLRETYGDMADCCEKQEPERNECFLSHKDDSPDLPKLKPDPNTLCDEF
+KADEKKFWGKYLYEIARRHPYFYAPELLYYANKYNGVFQECCQAEDKGAC
+LLPKIETMREKVLASSARQRLRCASIQKFGERALKAWSVARLSQKFPKAE
+FVEVTKLVTDLTKVHKECCHGDLLECADDRADLAKYICDNQDTISSKLKE
+CCDKPLLEKSHCIAEVEKDAIPENLPPLTADFAEDKDVCKNYQEAKDAFL
+GSFLYEYSRRHPEYAVSVLLRLAKEYEATLEECCAKDDPHACYSTVFDKL
+KHLVDEPQNLIKQNCDQFEKLGEYGFQNALIVRYTRKVPQVSTPTLVEVS
+RSLGKVGTRCCTKPESERMPCTEDYLSLILNRLCVLHEKTPVSEKVTKCC
+TESLVNRRPCFSALTPDETYVPKAFDEKLFTFHADICTLPDTEKQIKKQT
+ALVELLKHKPKATEEQLKTVMENFVAFVDKCCAADDKEACFAVEGPKLVV
+STQTALA
+>sp|AMYS_HUMAN|
+MKLFWLLFTIGFCWAQYSSNTQQGRTSIVHLFEWRWVDIALECERYLAPK
+GFGGVQVSPPNENVAIHNPFRPWWERYQPVSYKLCTRSGNEDEFRNMVTR
+CNNVGVRIYVDAVINHMCGNAVSAGTSSTCGSYFNPGSRDFPAVPYSGWD
+FNDGKCKTGSGDIENYNDATQVRDCRLSGLLDLALGKDYVRSKIAEYMNH
+LIDIGVAGFRIDASKHMWPGDIKAILDKLHNLNSNWFPEGSKPFIYQEVI
+DLGGEPIKSSDYFGNGRVTEFKYGAKLGTVIRKWNGEKMSYLKNWGEGWG
+FMPSDRALVFVDNHDNQRGHGAGGASILTFWDARLYKMAVGFMLAHPYGF
+TRVMSSYRWPRYFENGKDVNDWVGPPNDNGVTKEVTINPDTTCGNDWVCE
+HRWRQIRNMVNFRNVVDGQPFTNWYDNGSNQVAFGRGNRGFIVFNNDDWT
+FSLTLQTGLPAGTYCDVISGDKINGNCTGIKIYVSDDGKAHFSISNSAED
+PFIAIHAESKL
\ No newline at end of file
diff -r 15c2dda543b3 -r 5d3626c86071 test-data/bsa.mzML
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/bsa.mzML	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,96 @@
+
+
+  
+    
+      
+      
+    
+    
+      
+        
+        
+      
+      
+        
+          
+          
+          
+        
+      
+    
+    
+      
+        
+      
+    
+    
+      
+        
+      
+    
+    
+      
+        
+          
+        
+        
+          
+        
+      
+    
+    
+      
+        
+          
+          
+          
+          
+          
+          
+          
+          
+          
+          
+          
+            
+            
+            
+          
+          
+            
+              
+                
+                  
+                  
+                
+              
+              
+              
+            
+          
+          
+            
+              
+              
+              
+              RPrt68CEaUDI7236swRrQLecS3FVwmxAdcjNcANFbUBlwi/182NuQL/xtWeWAm9AGm7A54clb0BNSkG3FyJxQJOMnIU9QXFAFCLgEKpScUCe6pCb4fJyQNbiUwAME3RA529CIQJSdUDmllZDYmJ2QFch5SfVQXdAOiNKe4NRd0A2WaMeolJ4QGwE4nX9YXhAG7tE9VZyeUAaNPRPcNN6QDyInSl0JHtAEqCmli1Te0CuDRXj/JJ7QBsS91h6gnxAet/42jOzfEC94xQdyZJ9QEbT2clgMn5Ah78ma9RCf0CAYI4ev1J/QPCiryCNKoBAqiuf5XkxgEDtuyL4H3qAQDI4Sl7dgYBAEVMiiZ66gEBi+IiY0tGAQDMbZJKR2YBAjL6CNCMKgUA0ETY8vUGBQEymCkYlUoFAzzEge71hgUB8D5cc97WBQKYnLPHAuYFArDlAMEfigUBWSPlJ9fGBQP2H9NsX/oFApMLYQlApgkBmFMstLUKCQG2tLxLaWYJAMPDce3ixgkAYsrrVc7mCQHAlOzbCOYNAPrMkQI1Bg0Ang6PkFWqDQOrPfqRIgoNAdZMYBBaKg0BaL4ZyIrqDQGIQWDm0woNANUHUfcDJg0AMAiuHVgqEQCzUmubdUoRAL6NYbilqhEDXwFYJlpqEQGjon+CiooRA9Pi9TT/ShEBrZcIvNdqEQBqjdVR16oRAs5jYfBzyhEBx5ldzwFGFQIz4Tsx6eoVAhPBo4wiKhUCCHJQwE5KFQCUGgZUD0oVAy9b6IuHZhUBeukkMAmKGQM11Gmkp8oZA1xcJbTnDh0AWwf9WMsuHQJhRLLd0SohAldQJaGJTiEAUyy2thoKIQNuizAbZColAjZyFPa0SiUDLSpNSkGKJQCveyDzymolAS80eaMXqiUB47j1csvKJQONTAIzneopAejarPlfTikAMPPcerlOLQDdPdciNW4tA1EM0usPji0CY3ZOHBauMQD90QX3L845A/+xHigh8j0D7OnDOKPaRQAUXK2oQ+pFAbqMBvCU+kkA=
+            
+            
+              
+              
+              
+              AABIQgAAUEIAAMpCAABkQwAA8EEAACBCAEAHRQAAgEIAACRDAICRQwAAhEIAAE9EAADwQQAAjkIAAAhCAAAEQgAAMEIAAChDAACmQgAA4EEAAJBDAADGQgAA1EIAAHhCAAAEQwAAHEMAAKpCAAAcQgAAgUMAALRCAIDuQwAADEIAAJxCAMCERAAAOEIAADlDAAAAQgAA3kIAAPxCAICfQwAASUMAAAtDAADoQQAA00MAgMNDAADoQQAA+UMAAOBBAABUQgAAH0MAAExCAICFQwAA+EEAABxCAACMQgAAIEIAAKhCAIDVQwAAKEMAAFpEAAAIQgAABEIAAOBBAAAMQgAA4EEAAIpCAAA1QwAA+EIAAFBCAADoQQAAEEIAACRCAIC8QwAAFUQAAKRDAAAkQgAAgUMAAAhCAIDFQwAA9kIAAOhBAADEQgAAFEMAAAxCAADUQgAAO0MAAApDAADgQQAA8EEAAANDAEAmRAAACEIAAL5CAAASRAAAAEIAABFDAEBQRA==
+            
+          
+        
+      
+    
+  
+  
+    
+      2685
+    
+  
+  7058
+  b76171188a63cfad075d3738a172b15f1f9e0c4c
+
diff -r 15c2dda543b3 -r 5d3626c86071 test-data/bsa.mzid
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/bsa.mzid	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,123 @@
+
+
+
+    
+    
+    
+
+
+    
+        
+            
+        
+    
+
+
+    
+        
+    
+    
+        YICDNQDTISSK
+        
+            
+        
+    
+    
+
+
+    
+        
+        
+    
+
+
+    
+        
+            
+        
+        
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+            
+        
+        
+            
+                
+            
+        
+        
+            
+                
+                    
+                
+            
+        
+        
+            
+            
+        
+        
+            
+        
+    
+
+
+    
+        
+            
+                
+            
+            
+                
+            
+        
+        
+            
+                
+            
+            
+                
+            
+        
+    
+    
+        
+            
+                
+                    
+                
+            
+            
+                
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                    
+                
+            
+        
+    
+
+
diff -r 15c2dda543b3 -r 5d3626c86071 tool-data/msgfplus_mods.loc.sample
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/msgfplus_mods.loc.sample	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,50 @@
+#This file lists the names of inbuilt chemical modifications accepted by msgfplus
+#Each entry consists of 4 tab separated fields like this
+#			
+#
+#Modification strings should conform to the standard MSGFPlus syntax with the following exception
+#The ModType field is overridden by the msgfplus_search.rb tool. In other words any of these mods
+#May be passed to the tool as a variable or fixed mod and the tool will substitute the appropriate ModType
+#value
+#
+#Standard MSGFPlus syntax is
+#
+# To input a modification, use the following command:
+# Mass or CompositionStr, Residues, ModType, Position, Name (all the five fields are required).
+# CompositionStr (C[Num]H[Num]N[Num]O[Num]S[Num]P[Num])
+# 	- C (Carbon), H (Hydrogen), N (Nitrogen), O (Oxygen), S (Sulfer) and P (Phosphorus) are allowed.
+# 	- Atom can be omitted. The sequence of atoms must be followed. 
+# 	- Negative numbers are allowed.
+# 	- E.g. C2H2O1 (valid), H2C1O1 (invalid) 
+# Mass can be used instead of CompositionStr. It is important to specify accurate masses (integer masses are insufficient).
+# 	- E.g. 15.994915 
+# Residues: affected amino acids (must be upper letters)
+# 	- Must be uppor letters or *
+# 	- Use * if this modification is applicable to any residue. 
+# 	- * should not be "anywhere" modification (e.g. "15.994915, *, opt, any, Oxidation" is not allowed.) 
+# 	- E.g. NQ, *
+# ModType: "fix" for fixed modifications, "opt" for variable modifications (case insensitive)
+# Position: position in the peptide where the modification can be attached. 
+# 	- One of the following five values should be used:
+# 	- any (anywhere), N-term (peptide N-term), C-term (peptide C-term), Prot-N-term (protein N-term), Prot-C-term (protein C-term) 
+# 	- Case insensitive
+# 	- "-" can be omitted
+# 	- E.g. any, Any, Prot-n-Term, ProtNTerm => all valid
+# Name: name of the modification (Unimod PSI-MS name)
+# 	- For proper mzIdentML output, this name should be the same as the Unimod PSI-MS name
+# 	- E.g. Phospho, Acetyl
+#C2H3N1O1,C,fix,any,Carbamidomethyl 		# Fixed Carbamidomethyl C
+# Variable Modifications (default: none)
+#O1,M,opt,any,Oxidation				# Oxidation M
+#15.994915,M,opt,any,Oxidation			# Oxidation M (mass is used instead of CompositionStr)
+#H-1N-1O1,NQ,opt,any,Deamidated			# Negative numbers are allowed.
+#C2H3NO,*,opt,N-term,Carbamidomethyl		# Variable Carbamidomethyl N-term
+#H-2O-1,E,opt,N-term,Pyro_glu			# Pyro-glu from E
+#H-3N-1,Q,opt,N-term,Pyro-glu			# Pyro-glu from Q
+#C2H2O,*,opt,Prot-N-term,Acetyl			# Acetylation Protein N-term
+#C2H2O1,K,opt,any,Acetyl			# Acetylation K
+#CH2,K,opt,any,Methy				# Methylation K
+#HO3P,STY,opt,any,Phospho			# Phosphorylation STY
+
+Carbamidomethyl C	carbamidomethyl_c_	C2H3N1O1,C,opt,any,Carbamidomethyl	carbamidomethyl_c_
+Oxidation M	oxidation_m_	O1,M,opt,any,Oxidation	oxidation_m_
\ No newline at end of file
diff -r 15c2dda543b3 -r 5d3626c86071 tool-data/pepxml_databases.loc.sample
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/pepxml_databases.loc.sample	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,13 @@
+#This file lists the names of protein databases installed locally in protk. 
+# These are used by omssa and x!tandem as well as the "mascot to pepxml" tool
+# In order to combine search results with Interprophet searches must be run against an identical database
+#
+# Entries should follow the be structured as follows
+# Display_name omssa_tandem_dbname dbkey
+#
+#
+Swissprot	spall_	spall	spall_
+Combined PlasmboDB (falciparum) and Swissprot Human	plasmodb_pfalciparum_sphuman_	plasmodb_pfalciparum_sphuman	plasmodb_pfalciparum_sphuman_
+Swissprot Human	sphuman_	sphuman	sphuman_
+Combined Swissprot/TRembl Human	sptrhuman_	sptrhuman	sptrhuman_
+Swissprot Mouse	spmouse_	spmouse	spmouse_
diff -r 15c2dda543b3 -r 5d3626c86071 tool_dependencies.xml
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml	Wed Mar 05 01:04:22 2014 -0500
@@ -0,0 +1,12 @@
+
+
+    
+         
+    
+    
+         
+    
+    
+         
+    
+