root/galaxy-central/lib/galaxy/tools/__init__.py @ 2

Revision 2, 99.3 KB (committer: hatakeyama, 14 years ago)

1"""
2Classes encapsulating galaxy tools and tool configuration.
3"""
4import pkg_resources;
5
6pkg_resources.require( "simplejson" )
7
8import logging, os, string, sys, tempfile, glob, shutil, types, urllib
9import simplejson
10import binascii
11from UserDict import DictMixin
12from galaxy.util.odict import odict
13from galaxy.util.bunch import Bunch
14from galaxy.util.template import fill_template
15from galaxy import util, jobs, model
16from elementtree import ElementTree
17from parameters import *
18from parameters.grouping import *
19from parameters.output import ToolOutputActionGroup
20from parameters.validation import LateValidationError
21from parameters.input_translation import ToolInputTranslator
22from galaxy.util.expressions import ExpressionContext
23from galaxy.tools.test import ToolTestBuilder
24from galaxy.tools.actions import DefaultToolAction
25from galaxy.tools.deps import DependencyManager
26from galaxy.model import directory_hash_id
27from galaxy.util.none_like import NoneDataset
28from galaxy.datatypes import sniff
29from cgi import FieldStorage
30from galaxy.util.hash_util import *
31
32log = logging.getLogger( __name__ )

class ToolNotFoundException( Exception ):
    pass

class ToolBox( object ):
    """
    Container for a collection of tools
    """

    def __init__( self, config_filename, tool_root_dir, app ):
        """
        Create a toolbox from the config file named by `config_filename`,
        using `tool_root_dir` as the base directory for finding individual
        tool config files.
        """
        self.tools_by_id = {}
        self.workflows_by_id = {}
        self.tool_panel = odict()
        self.tool_root_dir = tool_root_dir
        self.app = app
        self.init_dependency_manager()
        try:
            self.init_tools( config_filename )
        except:
            log.exception( "ToolBox error reading %s", config_filename )
    def init_tools( self, config_filename ):
        """
        Read the configuration file and load each tool.
        The following tags are currently supported:
        <toolbox>
            <tool file="data_source/upload.xml"/>            # tools outside sections
            <label text="Basic Tools" id="basic_tools" />    # labels outside sections
            <workflow id="529fd61ab1c6cc36" />               # workflows outside sections
            <section name="Get Data" id="getext">            # sections
                <tool file="data_source/biomart.xml" />      # tools inside sections
                <label text="In Section" id="in_section" />  # labels inside sections
                <workflow id="adb5f5c93f827949" />           # workflows inside sections
            </section>
        </toolbox>
        """
        def load_tool( elem, panel_dict ):
            try:
                path = elem.get( "file" )
                tool = self.load_tool( os.path.join( self.tool_root_dir, path ) )
                self.tools_by_id[ tool.id ] = tool
                key = 'tool_' + tool.id
                panel_dict[ key ] = tool
                log.debug( "Loaded tool: %s %s" % ( tool.id, tool.version ) )
            except:
                log.exception( "error reading tool from path: %s" % path )
        def load_workflow( elem, panel_dict ):
            try:
                # TODO: should id be encoded?
                workflow_id = elem.get( 'id' )
                workflow = self.load_workflow( workflow_id )
                self.workflows_by_id[ workflow_id ] = workflow
                key = 'workflow_' + workflow_id
                panel_dict[ key ] = workflow
                log.debug( "Loaded workflow: %s %s" % ( workflow_id, workflow.name ) )
            except:
                log.exception( "error loading workflow: %s" % workflow_id )
        def load_label( elem, panel_dict ):
            label = ToolSectionLabel( elem )
            key = 'label_' + label.id
            panel_dict[ key ] = label
        def load_section( elem, panel_dict ):
            section = ToolSection( elem )
            log.debug( "Loading section: %s" % section.name )
            for section_elem in elem:
                if section_elem.tag == 'tool':
                    load_tool( section_elem, section.elems )
                elif section_elem.tag == 'workflow':
                    load_workflow( section_elem, section.elems )
                elif section_elem.tag == 'label':
                    load_label( section_elem, section.elems )
            key = 'section_' + section.id
            panel_dict[ key ] = section

        log.info( "parsing the tool configuration" )
        tree = util.parse_xml( config_filename )
        root = tree.getroot()
        for elem in root:
            if elem.tag == 'tool':
                load_tool( elem, self.tool_panel )
            elif elem.tag == 'workflow':
                load_workflow( elem, self.tool_panel )
            elif elem.tag == 'section':
                load_section( elem, self.tool_panel )
            elif elem.tag == 'label':
                load_label( elem, self.tool_panel )
    def load_tool( self, config_file ):
        """
        Load a single tool from the file named by `config_file` and return
        an instance of `Tool`.
        """
        # Parse XML configuration file and get the root element
        tree = util.parse_xml( config_file )
        root = tree.getroot()
        # Allow specifying a different tool subclass to instantiate
        if root.find( "type" ) is not None:
            type_elem = root.find( "type" )
            module = type_elem.get( 'module', 'galaxy.tools' )
            cls = type_elem.get( 'class' )
            mod = __import__( module, globals(), locals(), [cls] )
            ToolClass = getattr( mod, cls )
        elif root.get( 'tool_type', None ) is not None:
            ToolClass = tool_types.get( root.get( 'tool_type' ) )
        else:
            ToolClass = Tool
        return ToolClass( config_file, root, self.app )

    def reload( self, tool_id ):
        """
        Attempt to reload the tool identified by `tool_id` and, if successful,
        replace the old tool.
        """
        if tool_id not in self.tools_by_id:
            raise ToolNotFoundException( "No tool with id %s" % tool_id )
        old_tool = self.tools_by_id[ tool_id ]
        new_tool = self.load_tool( old_tool.config_file )
        # Replace old_tool with new_tool in self.tool_panel
        tool_key = 'tool_' + tool_id
        for key, val in self.tool_panel.items():
            if key == tool_key:
                self.tool_panel[ key ] = new_tool
                break
            elif key.startswith( 'section' ):
                section = val
                for section_key, section_val in section.elems.items():
                    if section_key == tool_key:
                        self.tool_panel[ key ].elems[ section_key ] = new_tool
                        break
        self.tools_by_id[ tool_id ] = new_tool
        log.debug( "Reloaded tool %s %s" % ( old_tool.id, old_tool.version ) )

    def load_workflow( self, workflow_id ):
        """
        Return an instance of `Workflow` identified by `workflow_id`, which
        is encoded in the tool panel configuration.
        """
        id = self.app.security.decode_id( workflow_id )
        stored = self.app.model.context.query( self.app.model.StoredWorkflow ).get( id )
        return stored.latest_workflow

    def init_dependency_manager( self ):
        self.dependency_manager = None
        if self.app.config.use_tool_dependencies:
            self.dependency_manager = DependencyManager( [ self.app.config.tool_dependency_dir ] )

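# Illustrative sketch (not part of the original module): constructing a
# ToolBox and reloading a tool. Assumes `app` is a configured Galaxy
# application object and that "tool_conf.xml" follows the layout shown in
# the init_tools docstring above.
#
#   toolbox = ToolBox( "tool_conf.xml", "tools", app )
#   tool = toolbox.tools_by_id.get( "upload1" )   # look up a loaded tool by id
#   toolbox.reload( "upload1" )                   # re-read its XML config file
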
class ToolSection( object ):
    """
    A group of tools with similar type/purpose that will be displayed as a
    group in the user interface.
    """
    def __init__( self, elem ):
        self.name = elem.get( "name" )
        self.id = elem.get( "id" )
        self.version = elem.get( "version" )
        self.elems = odict()

class ToolSectionLabel( object ):
    """
    A label for a set of tools that can be displayed above groups of tools
    and sections in the user interface.
    """
    def __init__( self, elem ):
        self.text = elem.get( "text" )
        self.id = elem.get( "id" )
        self.version = elem.get( "version" )

class DefaultToolState( object ):
    """
    Keeps track of the state of a user's interaction with a tool between
    requests. The default tool state keeps track of the current page (for
    multipage "wizard" tools) and the values of all parameters.
    """
    def __init__( self ):
        self.page = 0
        self.inputs = None
    def encode( self, tool, app, secure=True ):
        """
        Convert the data to a string
        """
        # Convert parameters to a dictionary of strings, and save the current
        # page in that dict
        value = params_to_strings( tool.inputs, self.inputs, app )
        value["__page__"] = self.page
        value = simplejson.dumps( value )
        # Make it secure
        if secure:
            a = hmac_new( app.config.tool_secret, value )
            b = binascii.hexlify( value )
            return "%s:%s" % ( a, b )
        else:
            return value
    def decode( self, value, tool, app, secure=True ):
        """
        Restore the state from a string
        """
        if secure:
            # Extract and verify hash
            a, b = value.split( ":" )
            value = binascii.unhexlify( b )
            test = hmac_new( app.config.tool_secret, value )
            assert a == test
        # Restore from string
        values = json_fix( simplejson.loads( value ) )
        self.page = values.pop( "__page__" )
        self.inputs = params_from_strings( tool.inputs, values, app, ignore_errors=True )

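# Illustrative sketch (not part of the original module): round-tripping tool
# state through encode()/decode(). Assumes `tool`, `app` and `trans` are a
# loaded Tool, the Galaxy application, and a request transaction; the secure
# form signs the simplejson payload with app.config.tool_secret and produces
# "<hmac>:<hex-encoded json>".
#
#   state = tool.new_state( trans )
#   token = state.encode( tool, app )      # e.g. "ab12...:7b225f5f70616765..."
#   restored = DefaultToolState()
#   restored.decode( token, tool, app )    # verifies the HMAC, restores inputs
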
class ToolOutput( object ):
    """
    Represents an output dataset produced by a tool. For backward
    compatibility this behaves as if it were the tuple:
      ( format, metadata_source, parent )
    """

    def __init__( self, name, format=None, metadata_source=None,
                  parent=None, label=None, filters=None, actions=None ):
        self.name = name
        self.format = format
        self.metadata_source = metadata_source
        self.parent = parent
        self.label = label
        self.filters = filters or []
        self.actions = actions

    # Tuple emulation

    def __len__( self ):
        return 3

    def __getitem__( self, index ):
        if index == 0:
            return self.format
        elif index == 1:
            return self.metadata_source
        elif index == 2:
            return self.parent
        else:
            raise IndexError( index )

    def __iter__( self ):
        return iter( ( self.format, self.metadata_source, self.parent ) )

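# Illustrative sketch (not part of the original module): because ToolOutput
# emulates a 3-tuple, older code that expects ( format, metadata_source,
# parent ) keeps working. Assumes `output` is a ToolOutput instance.
#
#   format, metadata_source, parent = output    # via __iter__
#   assert output[0] == output.format           # via __getitem__
#   assert len( output ) == 3                   # via __len__
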
class ToolRequirement( object ):
    """
    Represents an external requirement that must be available for the tool to
    run (for example, a program, package, or library). Requirements can
    optionally assert a specific version.
    """
    def __init__( self ):
        self.name = None
        self.type = None
        self.version = None

class Tool:
    """
    Represents a computational tool that can be executed through Galaxy.
    """

    tool_type = 'default'

    def __init__( self, config_file, root, app ):
        """
        Load a tool from the config named by `config_file`
        """
        # Determine the full path of the directory where the tool config is
        self.config_file = config_file
        self.tool_dir = os.path.dirname( config_file )
        self.app = app
        # Parse XML element containing configuration
        self.parse( root )

    @property
    def sa_session( self ):
        """
        Returns a SQLAlchemy session
        """
        return self.app.model.context

    def parse( self, root ):
        """
        Read tool configuration from the element `root` and fill in `self`.
        """
        # Get the (user visible) name of the tool
        self.name = root.get( "name" )
        if not self.name:
            raise Exception, "Missing tool 'name'"
        # Get the UNIQUE id for the tool
        # TODO: can this be generated automatically?
        self.id = root.get( "id" )
        if not self.id:
            raise Exception, "Missing tool 'id'"
        self.version = root.get( "version" )
        if not self.version:
            # For backward compatibility, some tools may not have versions yet.
            self.version = "1.0.0"
        # Support multi-byte tools
        self.is_multi_byte = util.string_as_bool( root.get( "is_multi_byte", False ) )
        # Force history to fully refresh after job execution for this tool.
        # Useful, e.g., when an indeterminate number of outputs are created by
        # a tool.
        self.force_history_refresh = util.string_as_bool( root.get( 'force_history_refresh', 'False' ) )
        # Load input translator, used by datasource tools to change
        # names/values of incoming parameters
        self.input_translator = root.find( "request_param_translation" )
        if self.input_translator:
            self.input_translator = ToolInputTranslator.from_element( self.input_translator )
        # Command line (template). Optional for tools that do not invoke a
        # local program
        command = root.find( "command" )
        if command is not None and command.text is not None:
            self.command = command.text.lstrip() # get rid of leading whitespace
            interpreter = command.get( "interpreter" )
            if interpreter:
                # TODO: path munging for cluster/dataset server relocatability
                executable = self.command.split()[0]
                abs_executable = os.path.abspath( os.path.join( self.tool_dir, executable ) )
                self.command = self.command.replace( executable, abs_executable, 1 )
                self.command = interpreter + " " + self.command
        else:
            self.command = ''
        # Parameters used to build URL for redirection to external app
        redirect_url_params = root.find( "redirect_url_params" )
        if redirect_url_params is not None and redirect_url_params.text is not None:
            # get rid of leading / trailing white space
            redirect_url_params = redirect_url_params.text.strip()
            # Replace remaining white space with something we can safely split on later
            # when we are building the params
            self.redirect_url_params = redirect_url_params.replace( ' ', '**^**' )
        else:
            self.redirect_url_params = ''
        # Short description of the tool
        self.description = util.xml_text( root, "description" )
        # Job runner
        if self.app.config.start_job_runners is None:
            # Jobs are always local regardless of tool config if no additional
            # runners are started
            self.job_runner = "local:///"
        else:
            # Set job runner to the cluster default
            self.job_runner = self.app.config.default_cluster_job_runner
            for tup in self.app.config.tool_runners:
                if tup[0] == self.id.lower():
                    self.job_runner = tup[1]
                    break
        # Is this a 'hidden' tool (hidden in the tool menu)?
        self.hidden = util.xml_text( root, "hidden" )
        if self.hidden:
            self.hidden = util.string_as_bool( self.hidden )
        # Load any tool specific code (optional). Edit: INS 5/29/2007 --
        # allow code files to have access to the individual tool's
        # "module" if it has one.  Allows us to reuse code files, etc.
        self.code_namespace = dict()
        self.hook_map = {}
        for code_elem in root.findall( "code" ):
            for hook_elem in code_elem.findall( "hook" ):
                for key, value in hook_elem.items():
                    # map hook to function
                    self.hook_map[key] = value
            file_name = code_elem.get( "file" )
            code_path = os.path.join( self.tool_dir, file_name )
            execfile( code_path, self.code_namespace )
        # Load any tool specific options (optional)
        self.options = dict( sanitize=True, refresh=False )
        for option_elem in root.findall( "options" ):
            for option, value in self.options.copy().items():
                if isinstance( value, type( False ) ):
                    self.options[option] = util.string_as_bool( option_elem.get( option, str( value ) ) )
                else:
                    self.options[option] = option_elem.get( option, str( value ) )
        self.options = Bunch( **self.options )
        # Parse tool inputs (if there are any required)
        self.parse_inputs( root )
        # Parse tool help
        self.parse_help( root )
        # Description of outputs produced by an invocation of the tool
        self.parse_outputs( root )
        # Any extra generated config files for the tool
        self.config_files = []
        conf_parent_elem = root.find( "configfiles" )
        if conf_parent_elem:
            for conf_elem in conf_parent_elem.findall( "configfile" ):
                name = conf_elem.get( "name" )
                filename = conf_elem.get( "filename", None )
                text = conf_elem.text
                self.config_files.append( ( name, filename, text ) )
        # Action
        action_elem = root.find( "action" )
        if action_elem is None:
            self.tool_action = DefaultToolAction()
        else:
            module = action_elem.get( 'module' )
            cls = action_elem.get( 'class' )
            mod = __import__( module, globals(), locals(), [cls] )
            self.tool_action = getattr( mod, cls )()
        # User interface hints
        self.uihints = {}
        uihints_elem = root.find( "uihints" )
        if uihints_elem is not None:
            for key, value in uihints_elem.attrib.iteritems():
                self.uihints[ key ] = value
        # Tests
        tests_elem = root.find( "tests" )
        if tests_elem:
            try:
                self.parse_tests( tests_elem )
            except:
                log.exception( "Failed to parse tool tests" )
        else:
            self.tests = None
        # Requirements (dependencies)
        self.requirements = []
        requirements_elem = root.find( "requirements" )
        if requirements_elem:
            self.parse_requirements( requirements_elem )
        # Determine if this tool can be used in workflows
        self.is_workflow_compatible = self.check_workflow_compatible()

    def parse_inputs( self, root ):
        """
        Parse the "<inputs>" element and create appropriate `ToolParameter`s.
        This implementation supports multiple pages and grouping constructs.
        """
        # Load parameters (optional)
        input_elem = root.find( "inputs" )
        if input_elem:
            # Handle properties of the input form
            self.check_values = util.string_as_bool( input_elem.get( "check_values", "true" ) )
            self.nginx_upload = util.string_as_bool( input_elem.get( "nginx_upload", "false" ) )
            self.action = input_elem.get( 'action', '/tool_runner/index' )
            # If we have an nginx upload, save the action as a tuple instead of
            # a string. The actual action needs to get url_for run to add any
            # prefixes, and we want to avoid adding the prefix to the
            # nginx_upload_path. This logic is handled in the tool_form.mako
            # template.
            if self.nginx_upload and self.app.config.nginx_upload_path:
                if '?' in urllib.unquote_plus( self.action ):
                    raise Exception( 'URL parameters in a non-default tool action can not be used ' \
                                     'in conjunction with nginx upload.  Please convert them to ' \
                                     'hidden POST parameters' )
                self.action = ( self.app.config.nginx_upload_path + '?nginx_redir=',
                                urllib.unquote_plus( self.action ) )
            self.target = input_elem.get( "target", "galaxy_main" )
            self.method = input_elem.get( "method", "post" )
            # Parse the actual parameters
            self.inputs = odict()
            self.inputs_by_page = list()
            self.display_by_page = list()
            enctypes = set()
            # Handle multiple page case
            pages = input_elem.findall( "page" )
            for page in ( pages or [ input_elem ] ):
                display, inputs = self.parse_input_page( page, enctypes )
                self.inputs_by_page.append( inputs )
                self.inputs.update( inputs )
                self.display_by_page.append( display )
            self.display = self.display_by_page[0]
            self.npages = len( self.inputs_by_page )
            self.last_page = len( self.inputs_by_page ) - 1
            self.has_multiple_pages = bool( self.last_page )
            # Determine the needed enctype for the form
            if len( enctypes ) == 0:
                self.enctype = "application/x-www-form-urlencoded"
            elif len( enctypes ) == 1:
                self.enctype = enctypes.pop()
            else:
                raise Exception, "Conflicting required enctypes: %s" % str( enctypes )
        # Check if the tool either has no parameters or only hidden (and
        # thus hardcoded) parameters. FIXME: hidden parameters aren't
        # parameters at all really, and should be passed in a different
        # way, making this check easier.
        self.input_required = False
        for param in self.inputs.values():
            if not isinstance( param, ( HiddenToolParameter, BaseURLToolParameter ) ):
                self.input_required = True
                break

    def parse_help( self, root ):
        """
        Parse the help text for the tool. Formatted in reStructuredText.
        This implementation supports multiple pages.
        """
        # TODO: Allow raw HTML or an external link.
        self.help = root.find( "help" )
        self.help_by_page = list()
        help_header = ""
        help_footer = ""
        if self.help is not None:
            help_pages = self.help.findall( "page" )
            help_header = self.help.text
            try:
                self.help = util.rst_to_html( self.help.text )
            except:
                log.exception( "error in help for tool %s" % self.name )
            # Multiple help page case
            if help_pages:
                for help_page in help_pages:
                    self.help_by_page.append( help_page.text )
                    help_footer = help_footer + help_page.tail
        # Each page has to be rendered all together because of the
        # backreferences allowed by rst
        try:
            self.help_by_page = [ util.rst_to_html( help_header + x + help_footer )
                                  for x in self.help_by_page ]
        except:
            log.exception( "error in multi-page help for tool %s" % self.name )
        # Pad out help pages to match npages ... could this be done better?
        while len( self.help_by_page ) < self.npages:
            self.help_by_page.append( self.help )

    def parse_outputs( self, root ):
        """
        Parse <outputs> elements and fill in self.outputs (keyed by name)
        """
        self.outputs = odict()
        out_elem = root.find( "outputs" )
        if not out_elem:
            return
        for data_elem in out_elem.findall( "data" ):
            output = ToolOutput( data_elem.get( "name" ) )
            output.format = data_elem.get( "format", "data" )
            output.change_format = data_elem.findall( "change_format" )
            output.metadata_source = data_elem.get( "metadata_source", "" )
            output.parent = data_elem.get( "parent", None )
            output.label = util.xml_text( data_elem, "label" )
            output.count = int( data_elem.get( "count", 1 ) )
            output.filters = data_elem.findall( 'filter' )
            output.tool = self
            output.actions = ToolOutputActionGroup( output, data_elem.find( 'actions' ) )
            self.outputs[ output.name ] = output

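    # Illustrative sketch (not part of the original module): the kind of
    # <outputs> element parse_outputs() consumes. The tag and attribute names
    # are the ones read above; the example values are made up.
    #
    #   <outputs>
    #       <data name="output1" format="tabular" metadata_source="input1">
    #           <filter>some_param == "yes"</filter>
    #       </data>
    #   </outputs>
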
    def parse_tests( self, tests_elem ):
        """
        Parse any "<test>" elements, create a `ToolTestBuilder` for each and
        store in `self.tests`.
        """
        self.tests = []
        # Composite datasets need a unique name: each test occurs in a fresh
        # history, but we'll keep it unique per set of tests
        composite_data_names_counter = 0
        for i, test_elem in enumerate( tests_elem.findall( 'test' ) ):
            name = test_elem.get( 'name', 'Test-%d' % ( i + 1 ) )
            maxseconds = int( test_elem.get( 'maxseconds', '120' ) )
            test = ToolTestBuilder( self, name, maxseconds )
            try:
                for param_elem in test_elem.findall( "param" ):
                    attrib = dict( param_elem.attrib )
                    if 'values' in attrib:
                        value = attrib[ 'values' ].split( ',' )
                    elif 'value' in attrib:
                        value = attrib['value']
                    else:
                        value = None
                    attrib['children'] = list( param_elem.getchildren() )
                    if attrib['children']:
                        # At this time, we can assume having children only
                        # occurs on DataToolParameter test items but this could
                        # change and would cause the below parsing to change
                        # based upon differences in children items
                        attrib['metadata'] = []
                        attrib['composite_data'] = []
                        attrib['edit_attributes'] = []
                        # Composite datasets need to be renamed uniquely
                        composite_data_name = None
                        for child in attrib['children']:
                            if child.tag == 'composite_data':
                                attrib['composite_data'].append( child )
                                if composite_data_name is None:
                                    # Generate a unique name; each test uses a
                                    # fresh history
                                    composite_data_name = '_COMPOSITE_RENAMED_%i_' \
                                        % ( composite_data_names_counter )
                                    composite_data_names_counter += 1
                            elif child.tag == 'metadata':
                                attrib['metadata'].append( child )
                            elif child.tag == 'edit_attributes':
                                attrib['edit_attributes'].append( child )
                        if composite_data_name:
                            # Composite datasets need implicit renaming;
                            # inserted at front of list so explicit declarations
                            # take precedence
                            attrib['edit_attributes'].insert( 0, { 'type': 'name', 'value': composite_data_name } )
                    test.add_param( attrib.pop( 'name' ), value, attrib )
                for output_elem in test_elem.findall( "output" ):
                    attrib = dict( output_elem.attrib )
                    name = attrib.pop( 'name', None )
                    if name is None:
                        raise Exception( "Test output does not have a 'name'" )
                    file = attrib.pop( 'file', None )
                    if file is None:
                        raise Exception( "Test output does not have a 'file'" )
                    attributes = {}
                    # Method of comparison
                    attributes['compare'] = attrib.pop( 'compare', 'diff' ).lower()
                    # Number of lines to allow to vary in logs (for dates, etc)
                    attributes['lines_diff'] = int( attrib.pop( 'lines_diff', '0' ) )
                    # Allow a file size to vary if sim_size compare
                    attributes['delta'] = int( attrib.pop( 'delta', '10000' ) )
                    attributes['sort'] = util.string_as_bool( attrib.pop( 'sort', False ) )
                    attributes['extra_files'] = []
                    for extra in output_elem.findall( 'extra_files' ):
                        # File or directory, when directory, compare basename
                        # by basename
                        extra_type = extra.get( 'type', 'file' )
                        extra_name = extra.get( 'name', None )
                        assert extra_type == 'directory' or extra_name is not None, \
                            'extra_files type (%s) requires a name attribute' % extra_type
                        extra_value = extra.get( 'value', None )
                        assert extra_value is not None, 'extra_files requires a value attribute'
                        extra_attributes = {}
                        extra_attributes['compare'] = extra.get( 'compare', 'diff' ).lower()
                        extra_attributes['delta'] = extra.get( 'delta', '0' )
                        extra_attributes['lines_diff'] = int( extra.get( 'lines_diff', '0' ) )
                        extra_attributes['sort'] = util.string_as_bool( extra.get( 'sort', False ) )
                        attributes['extra_files'].append( ( extra_type, extra_value, extra_name, extra_attributes ) )
                    test.add_output( name, file, attributes )
            except Exception, e:
                test.error = True
                test.exception = e
            self.tests.append( test )

    def parse_input_page( self, input_elem, enctypes ):
        """
        Parse a page of inputs. This basically just calls `parse_input_elem`,
        but it also deals with possible 'display' elements, which are supported
        only at the top/page level (not in groups).
        """
        inputs = self.parse_input_elem( input_elem, enctypes )
        # Display
        display_elem = input_elem.find( "display" )
        if display_elem is not None:
            display = util.xml_to_string( display_elem )
        else:
            display = None
        return display, inputs

    def parse_input_elem( self, parent_elem, enctypes, context=None ):
        """
        Parse a parent element whose children are inputs -- these could be
        groups (repeat, conditional) or param elements. Groups will be parsed
        recursively.
        """
        rval = odict()
        context = ExpressionContext( rval, context )
        for elem in parent_elem:
            # Repeat group
            if elem.tag == "repeat":
                group = Repeat()
                group.name = elem.get( "name" )
                group.title = elem.get( "title" )
                group.inputs = self.parse_input_elem( elem, enctypes, context )
                group.default = int( elem.get( "default", 0 ) )
                group.min = int( elem.get( "min", 0 ) )
                # Use float instead of int so that 'inf' can be used for no max
                group.max = float( elem.get( "max", "inf" ) )
                assert group.min <= group.max, \
                    ValueError( "Min repeat count must be less-than-or-equal to the max." )
                # Force default to be within min-max range
                group.default = min( max( group.default, group.min ), group.max )
                rval[group.name] = group
            elif elem.tag == "conditional":
                group = Conditional()
                group.name = elem.get( "name" )
                group.value_ref = elem.get( 'value_ref', None )
                group.value_ref_in_group = util.string_as_bool( elem.get( 'value_ref_in_group', 'True' ) )
                value_from = elem.get( "value_from" )
                if value_from:
                    value_from = value_from.split( ':' )
                    group.value_from = locals().get( value_from[0] )
                    group.test_param = rval[ group.value_ref ]
                    group.test_param.refresh_on_change = True
                    for attr in value_from[1].split( '.' ):
                        group.value_from = getattr( group.value_from, attr )
                    for case_value, case_inputs in group.value_from( context, group, self ).iteritems():
                        case = ConditionalWhen()
                        case.value = case_value
                        if case_inputs:
                            case.inputs = self.parse_input_elem(
                                ElementTree.XML( "<when>%s</when>" % case_inputs ), enctypes, context )
                        else:
                            case.inputs = {}
                        group.cases.append( case )
                else:
                    # Should have one child "input" which determines the case
                    input_elem = elem.find( "param" )
                    assert input_elem is not None, "<conditional> must have a child <param>"
                    group.test_param = self.parse_param_elem( input_elem, enctypes, context )
                    # Must refresh when test_param changes
                    group.test_param.refresh_on_change = True
                    # And a set of possible cases
                    for case_elem in elem.findall( "when" ):
                        case = ConditionalWhen()
                        case.value = case_elem.get( "value" )
                        case.inputs = self.parse_input_elem( case_elem, enctypes, context )
                        group.cases.append( case )
                rval[group.name] = group
            elif elem.tag == "upload_dataset":
                group = UploadDataset()
                group.name = elem.get( "name" )
                group.title = elem.get( "title" )
                group.file_type_name = elem.get( 'file_type_name', group.file_type_name )
                group.default_file_type = elem.get( 'default_file_type', group.default_file_type )
                group.metadata_ref = elem.get( 'metadata_ref', group.metadata_ref )
                rval[ group.file_type_name ].refresh_on_change = True
                rval[ group.file_type_name ].refresh_on_change_values = \
                    self.app.datatypes_registry.get_composite_extensions()
                group.inputs = self.parse_input_elem( elem, enctypes, context )
                rval[ group.name ] = group
            elif elem.tag == "param":
                param = self.parse_param_elem( elem, enctypes, context )
                rval[param.name] = param
        return rval

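    # Illustrative sketch (not part of the original module): the grouping
    # constructs parse_input_elem() understands. Tag and attribute names are
    # the ones read above; the parameter names and values are made up.
    #
    #   <inputs>
    #       <param name="input1" type="data" format="tabular" label="Dataset"/>
    #       <repeat name="queries" title="Query" min="1" max="5">
    #           <param name="q" type="text" label="Query string"/>
    #       </repeat>
    #       <conditional name="mode">
    #           <param name="mode_select" type="select" label="Mode"/>
    #           <when value="simple">
    #               <param name="cutoff" type="integer" value="10"/>
    #           </when>
    #       </conditional>
    #   </inputs>
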
    def parse_param_elem( self, input_elem, enctypes, context ):
        """
        Parse a single "<param>" element and return a ToolParameter instance.
        Also, if the parameter has a 'required_enctype', add it to the set
        `enctypes`.
        """
        param = ToolParameter.build( self, input_elem )
        param_enctype = param.get_required_enctype()
        if param_enctype:
            enctypes.add( param_enctype )
        # If the parameter depends on any other parameters, we must refresh the
        # form when it changes
        for name in param.get_dependencies():
            context[ name ].refresh_on_change = True
        return param

    def parse_requirements( self, requirements_elem ):
        """
        Parse each requirement from the <requirements> element and add to
        self.requirements
        """
        for requirement_elem in requirements_elem.findall( 'requirement' ):
            requirement = ToolRequirement()
            requirement.name = util.xml_text( requirement_elem )
            requirement.type = requirement_elem.get( "type", "package" )
            requirement.version = requirement_elem.get( "version" )
            self.requirements.append( requirement )

    def check_workflow_compatible( self ):
        """
        Determine if a tool can be used in workflows. External tools and the
        upload tool are currently not supported by workflows.
        """
        # Multiple page tools are not supported -- we're eliminating most
        # of these anyway
        if self.has_multiple_pages:
            return False
        # This is probably the best bet for detecting external web tools
        # right now
        if self.action != "/tool_runner/index":
            return False
        # HACK: upload is (as always) a special case because file parameters
        #       can't be persisted.
        if self.id == "upload1":
            return False
        # TODO: Any way to capture tools that dynamically change their own
        #       outputs?
        return True

    def new_state( self, trans, all_pages=False ):
        """
        Create a new `DefaultToolState` for this tool. It will be initialized
        with default values for inputs.

        Only inputs on the first page will be initialized unless `all_pages` is
        True, in which case all inputs regardless of page are initialized.
        """
        state = DefaultToolState()
        state.inputs = {}
        if all_pages:
            inputs = self.inputs
        else:
            inputs = self.inputs_by_page[ 0 ]
        self.fill_in_new_state( trans, inputs, state.inputs )
        return state

    def fill_in_new_state( self, trans, inputs, state, context=None ):
        """
        Fill in a tool state dictionary with default values for all parameters
        in the dictionary `inputs`. Grouping elements are filled in recursively.
        """
        context = ExpressionContext( state, context )
        for input in inputs.itervalues():
            state[ input.name ] = input.get_initial_value( trans, context )

    def get_param_html_map( self, trans, page=0, other_values={} ):
        """
        Return a dictionary containing the HTML representation of each
        parameter. This is used for rendering display elements. It is
        currently not compatible with grouping constructs.

        NOTE: This should be considered deprecated, it is only used for tools
              with `display` elements. These should be eliminated.
        """
        rval = dict()
        for key, param in self.inputs_by_page[page].iteritems():
            if not isinstance( param, ToolParameter ):
                raise Exception( "'get_param_html_map' only supported for simple parameters" )
            rval[key] = param.get_html( trans, other_values=other_values )
        return rval

    def get_param( self, key ):
        """
        Returns the parameter named `key` or None if there is no such
        parameter.
        """
        return self.inputs.get( key, None )

    def get_hook( self, name ):
        """
        Returns an object from the code file referenced by `code_namespace`
        (this will normally be a callable object)
        """
        if self.code_namespace:
            # Try to look up hook in self.hook_map, otherwise resort to default
            if name in self.hook_map and self.hook_map[name] in self.code_namespace:
                return self.code_namespace[self.hook_map[name]]
            elif name in self.code_namespace:
                return self.code_namespace[name]
        return None

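    # Illustrative sketch (not part of the original module): how a <code>
    # element (see parse(), which fills self.hook_map and self.code_namespace)
    # maps a hook name to a function in the exec'd code file. The file and
    # function names are made up; "validate_input" is the hook name used by
    # handle_input() below.
    #
    #   <code file="extra_code.py">
    #       <hook validate_input="my_validate"/>
    #   </code>
    #
    #   get_hook( "validate_input" )   # returns `my_validate` from that file
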
    def visit_inputs( self, value, callback ):
        """
        Call the function `callback` on each parameter of this tool. Visits
        grouping parameters recursively and constructs unique prefixes for
        each nested set of parameters. The callback method is then called as:

        `callback( level_prefix, parameter, parameter_value )`
        """
        # HACK: Yet another hack around check_values -- WHY HERE?
        if not self.check_values:
            return
        for input in self.inputs.itervalues():
            if isinstance( input, ToolParameter ):
                callback( "", input, value[input.name] )
            else:
                input.visit_inputs( "", value[input.name], callback )

    def handle_input( self, trans, incoming ):
        """
        Process incoming parameters for this tool from the dict `incoming`,
        update the tool state (or create it if none existed), and either return
        to the form or execute the tool (only if 'execute' was clicked and
        there were no errors).
        """
        # Get the state or create if not found
        if "tool_state" in incoming:
            encoded_state = util.string_to_object( incoming["tool_state"] )
            state = DefaultToolState()
            state.decode( encoded_state, self, trans.app )
        else:
            state = self.new_state( trans )
            # This feels a bit like a hack. It allows forcing full processing
            # of inputs even when there is no state in the incoming dictionary
            # by providing either 'runtool_btn' (the name of the submit button
            # on the standard run form) or "URL" (a parameter provided by
            # external data source tools).
            if "runtool_btn" not in incoming and "URL" not in incoming:
                return "tool_form.mako", dict( errors={}, tool_state=state, param_values={}, incoming={} )
        # Process incoming data
        if not self.check_values:
            # If `self.check_values` is false we don't do any checking or
            # processing on input parameters. This is used to pass raw values
            # through to/from external sites. FIXME: This should be handled
            # more cleanly, there is no reason why external sites need to
            # post back to the same URL that the tool interface uses.
            errors = {}
            params = incoming
        else:
            # Update state for all inputs on the current page taking new
            # values from `incoming`.
            errors = self.update_state( trans, self.inputs_by_page[state.page], state.inputs, incoming )
            # If the tool provides a `validate_input` hook, call it.
            validate_input = self.get_hook( 'validate_input' )
            if validate_input:
                validate_input( trans, errors, state.inputs, self.inputs_by_page[state.page] )
            params = state.inputs
        # Did the user actually click next / execute, or is this just
        # a refresh?
        if 'runtool_btn' in incoming or 'URL' in incoming or 'ajax_upload' in incoming:
            # If there were errors, we stay on the same page and display
            # error messages
            if errors:
                error_message = "One or more errors were found in the input you provided. The specific errors are marked below."
                return "tool_form.mako", dict( errors=errors, tool_state=state, incoming=incoming, error_message=error_message )
            # If we've completed the last page we can execute the tool
            elif state.page == self.last_page:
                _, out_data = self.execute( trans, incoming=params )
                try:
                    assert isinstance( out_data, odict )
                    return 'tool_executed.mako', dict( out_data=out_data )
                except:
                    return 'message.mako', dict( status='error', message='odict not returned from tool execution', refresh_frames=[] )
            # Otherwise move on to the next page
            else:
                state.page += 1
                # Fill in the default values for the next page
                self.fill_in_new_state( trans, self.inputs_by_page[ state.page ], state.inputs )
                return 'tool_form.mako', dict( errors=errors, tool_state=state )
        else:
            try:
                self.find_fieldstorage( state.inputs )
            except InterruptedUpload:
                # If inputs contain a file it won't persist.  Most likely this
                # is an interrupted upload.  We should probably find a more
                # standard method of determining an incomplete POST.
                return self.handle_interrupted( trans, state.inputs )
            except:
                pass
            # Just a refresh, render the form with updated state and errors.
            return 'tool_form.mako', dict( errors=errors, tool_state=state )

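    # Illustrative sketch (not part of the original module): the special keys
    # that handle_input() above and update_state() below look for in
    # `incoming`. The key names are the literal strings used in this file;
    # the repeat is assumed to be named "queries" and the values are made up.
    #
    #   incoming = {
    #       "tool_state": "...",           # encoded DefaultToolState, if any
    #       "runtool_btn": "Execute",      # the user clicked execute
    #       "queries_0_remove": "Remove",  # remove repeat instance with index 0
    #       "queries_add": "Add",          # append a new repeat instance
    #   }
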
    def find_fieldstorage( self, x ):
        if isinstance( x, FieldStorage ):
            raise InterruptedUpload( None )
        elif type( x ) is types.DictType:
            [ self.find_fieldstorage( y ) for y in x.values() ]
        elif type( x ) is types.ListType:
            [ self.find_fieldstorage( y ) for y in x ]

    def handle_interrupted( self, trans, inputs ):
        """
        Upon handling inputs, if it appears that we have received an incomplete
        form, do some cleanup or anything else deemed necessary.  Currently
        this is only likely during file uploads, but this method could be
        generalized and a method standardized for handling other tools.
        """
        # If the async upload tool has uploading datasets, we need to error them.
        if 'async_datasets' in inputs and inputs['async_datasets'] not in [ 'None', '', None ]:
            for id in inputs['async_datasets'].split( ',' ):
                try:
                    data = self.sa_session.query( trans.model.HistoryDatasetAssociation ).get( int( id ) )
                except:
                    log.exception( 'Unable to load precreated dataset (%s) sent in upload form' % id )
                    continue
                if trans.user is None and trans.galaxy_session.current_history != data.history:
                    log.error( 'Got a precreated dataset (%s) but it does not belong to anonymous user\'s current session (%s)'
                        % ( data.id, trans.galaxy_session.id ) )
                elif data.history.user != trans.user:
                    log.error( 'Got a precreated dataset (%s) but it does not belong to current user (%s)'
                        % ( data.id, trans.user.id ) )
                else:
                    data.state = data.states.ERROR
                    data.info = 'Upload of this dataset was interrupted.  Please try uploading again or'
                    self.sa_session.add( data )
                    self.sa_session.flush()
        # It's unlikely the user will ever see this.
        return 'message.mako', dict( status='error',
            message='Your upload was interrupted. If this was unintentional, please retry it.',
            refresh_frames=[], cont=None )

    def update_state( self, trans, inputs, state, incoming, prefix="", context=None,
                      update_only=False, old_errors={}, item_callback=None ):
        """
        Update the tool state in `state` using the user input in `incoming`.
        This is designed to be called recursively: `inputs` contains the
        set of inputs being processed, and `prefix` specifies a prefix to
        add to the name of each input to extract its value from `incoming`.

        If `update_only` is True, values that are not in `incoming` will
        not be modified. In this case `old_errors` can be provided, and any
        errors for parameters which were *not* updated will be preserved.
        """
        errors = dict()
        # Push this level onto the context stack
        context = ExpressionContext( state, context )
        # Iterate inputs and update (recursively)
        for input in inputs.itervalues():
            key = prefix + input.name
            if isinstance( input, Repeat ):
                group_state = state[input.name]
                # Create list of empty errors for each previously existing state
                group_errors = [ {} for i in range( len( group_state ) ) ]
                group_old_errors = old_errors.get( input.name, None )
                any_group_errors = False
                # Check any removals before updating state -- only one
                # removal can be performed, others will be ignored
                for i, rep_state in enumerate( group_state ):
                    rep_index = rep_state['__index__']
                    if key + "_" + str( rep_index ) + "_remove" in incoming:
                        if len( group_state ) > input.min:
                            del group_state[i]
                            del group_errors[i]
                            if group_old_errors:
                                del group_old_errors[i]
                            break
                        else:
                            group_errors[i] = { '__index__': 'Cannot remove repeat (min size=%i).' % input.min }
                            any_group_errors = True
                            # Only need to find one that can't be removed due to size,
                            # since only one removal is processed at a time anyway
                            break
                # Update state
                max_index = -1
                for i, rep_state in enumerate( group_state ):
                    rep_index = rep_state['__index__']
                    max_index = max( max_index, rep_index )
                    rep_prefix = "%s_%d|" % ( key, rep_index )
                    if group_old_errors:
                        rep_old_errors = group_old_errors[i]
                    else:
                        rep_old_errors = {}
                    rep_errors = self.update_state( trans,
                                                    input.inputs,
                                                    rep_state,
                                                    incoming,
                                                    prefix=rep_prefix,
                                                    context=context,
                                                    update_only=update_only,
                                                    old_errors=rep_old_errors,
                                                    item_callback=item_callback )
                    if rep_errors:
                        any_group_errors = True
                        group_errors[i].update( rep_errors )
                # Check for addition
                if key + "_add" in incoming:
                    if len( group_state ) < input.max:
                        new_state = {}
                        new_state['__index__'] = max_index + 1
                        self.fill_in_new_state( trans, input.inputs, new_state, context )
                        group_state.append( new_state )
                        group_errors.append( {} )
                    else:
                        group_errors[-1] = { '__index__': 'Cannot add repeat (max size=%i).' % input.max }
                        any_group_errors = True
                # Were there *any* errors for any repetition?
                if any_group_errors:
                    errors[input.name] = group_errors
            elif isinstance( input, Conditional ):
                group_state = state[input.name]
                group_old_errors = old_errors.get( input.name, {} )
                old_current_case = group_state['__current_case__']
                group_prefix = "%s|" % ( key )
                # Deal with the 'test' element and see if its value changed
                if input.value_ref and not input.value_ref_in_group:
                    # We are referencing an existing parameter, which is not
                    # part of this group
                    test_param_key = prefix + input.test_param.name
                else:
                    test_param_key = group_prefix + input.test_param.name
                test_param_error = None
                test_incoming = get_incoming_value( incoming, test_param_key, None )
                if test_param_key not in incoming \
                   and "__force_update__" + test_param_key not in incoming \
                   and update_only:
                    # Update only, keep previous value and state, but still
                    # recurse in case there are nested changes
                    value = group_state[ input.test_param.name ]
                    current_case = old_current_case
                    if input.test_param.name in old_errors:
                        errors[ input.test_param.name ] = old_errors[ input.test_param.name ]
                else:
                    # Get value of test param and determine current case
                    value, test_param_error = \
                        check_param( trans, input.test_param, test_incoming, context )
                    current_case = input.get_current_case( value, trans )
                if current_case != old_current_case:
                    # Current case has changed, throw away old state
                    group_state = state[input.name] = {}
                    # TODO: we should try to preserve values if we can
                    self.fill_in_new_state( trans, input.cases[current_case].inputs, group_state, context )
                    group_errors = dict()
                    group_old_errors = dict()
                else:
                    # Current case has not changed, update children
                    group_errors = self.update_state( trans,
                                                      input.cases[current_case].inputs,
                                                      group_state,
                                                      incoming,
                                                      prefix=group_prefix,
                                                      context=context,
                                                      update_only=update_only,
                                                      old_errors=group_old_errors,
                                                      item_callback=item_callback )
                if test_param_error:
                    group_errors[ input.test_param.name ] = test_param_error
                if group_errors:
                    errors[ input.name ] = group_errors
                # Store the current case in a special value
                group_state['__current_case__'] = current_case
                # Store the value of the test element
                group_state[ input.test_param.name ] = value
1122            elif isinstance( input, UploadDataset ):
1123                group_state = state[input.name]
1124                group_errors = []
1125                group_old_errors = old_errors.get( input.name, None )
1126                any_group_errors = False
1127                d_type = input.get_datatype( trans, context )
1128                writable_files = d_type.writable_files
1129                # Remove extra files
1130                while len( group_state ) > len( writable_files ):
1131                    del group_state[-1]
1132                    if group_old_errors:
1133                        del group_old_errors[-1]
1134                # Update state
1135                max_index = -1
1136                for i, rep_state in enumerate( group_state ):
1137                    rep_index = rep_state['__index__']
1138                    max_index = max( max_index, rep_index )
1139                    rep_prefix = "%s_%d|" % ( key, rep_index )
1140                    if group_old_errors:
1141                        rep_old_errors = group_old_errors[i]
1142                    else:
1143                        rep_old_errors = {}
1144                    rep_errors = self.update_state( trans,
1145                                                    input.inputs,
1146                                                    rep_state,
1147                                                    incoming,
1148                                                    prefix=rep_prefix,
1149                                                    context=context,
1150                                                    update_only=update_only,
1151                                                    old_errors=rep_old_errors,
1152                                                    item_callback=item_callback )
1153                    if rep_errors:
1154                        any_group_errors = True
1155                        group_errors.append( rep_errors )
1156                    else:
1157                        group_errors.append( {} )
1158                # Add new file upload states as needed
1159                offset = 1
1160                while len( writable_files ) > len( group_state ):
1161                    new_state = {}
1162                    new_state['__index__'] = max_index + offset
1163                    offset += 1
1164                    self.fill_in_new_state( trans, input.inputs, new_state, context )
1165                    group_state.append( new_state )
1166                    if any_group_errors:
1167                        group_errors.append( {} )
1168                # Were there *any* errors for any repetition?
1169                if any_group_errors:
1170                    errors[input.name] = group_errors
1171            else:
1172                if key not in incoming \
1173                   and "__force_update__" + key not in incoming \
1174                   and update_only:
1175                    # No new value provided, and we are only updating, so keep
1176                    # the old value (which should already be in the state) and
1177                    # preserve the old error message.
1178                    if input.name in old_errors:
1179                        errors[ input.name ] = old_errors[ input.name ]
1180                else:
1181                    incoming_value = get_incoming_value( incoming, key, None )
1182                    value, error = check_param( trans, input, incoming_value, context )
1183                    # If a callback was provided, allow it to process the value
1184                    if item_callback:
1185                        old_value = state.get( input.name, None )
1186                        value, error = item_callback( trans, key, input, value, error, old_value, context )                                         
1187                    if error:
1188                        errors[ input.name ] = error
1189                    state[ input.name ] = value
1190        return errors
1191           
1192    def get_static_param_values( self, trans ):
1193        """
1194        Returns a map of parameter names and values if the tool does not
1195        require any user input. Will raise an exception if any parameter
1196        does require input.
1197        """
1198        args = dict()
1199        for key, param in self.inputs.iteritems():
1200            if isinstance( param, HiddenToolParameter ):
1201                args[key] = param.value
1202            elif isinstance( param, BaseURLToolParameter ):
1203                args[key] = param.get_value( trans )
1204            else:
1205                raise Exception( "Unexpected parameter type" )
1206        return args
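    # Illustrative usage (a sketch, not part of this module): for a data
    # source tool whose inputs are all hidden or baseurl parameters, this
    # yields the complete, user-input-free argument map. `tool` and `trans`
    # are assumed to exist.
    #
    #     args = tool.get_static_param_values( trans )
    #     # e.g. {'GALAXY_URL': 'http://localhost:8080/tool_runner?tool_id=biomart'}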
1207           
1208    def execute( self, trans, incoming={}, set_output_hid=True ):
1209        """
1210        Execute the tool using parameter values in `incoming`. This just
1211        dispatches to the `ToolAction` instance specified by
1212        `self.tool_action`. In general this will create a `Job` that
1213        when run will build the tool's outputs, e.g. `DefaultToolAction`.
1214        """
1215        return self.tool_action.execute( self, trans, incoming=incoming, set_output_hid=set_output_hid )
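    # Illustrative usage (a sketch; `trans`, `hda` and the parameter names
    # are assumptions): with the default `DefaultToolAction`, execution
    # creates a Job and returns it along with the output datasets.
    #
    #     job, out_data = tool.execute( trans, incoming={ 'input1': hda, 'threshold': '5' } )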
1216       
1217    def params_to_strings( self, params, app ):
1218        return params_to_strings( self.inputs, params, app )
1219       
1220    def params_from_strings( self, params, app, ignore_errors=False ):
1221        return params_from_strings( self.inputs, params, app, ignore_errors )
1222           
1223    def check_and_update_param_values( self, values, trans ):
1224        """
1225        Check that all parameters have values, and fill in with default
1226        values where necessary. This could be called after loading values
1227        from a database in case new parameters have been added.
1228        """
1229        messages = {}
1230        self.check_and_update_param_values_helper( self.inputs, values, trans, messages )
1231        return messages
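    # Sketch of the intended use (names assumed): after loading a saved job's
    # parameters, report any inputs that were filled with defaults because the
    # tool config gained new parameters since the values were stored.
    #
    #     params = tool.params_from_strings( saved, app, ignore_errors=True )
    #     messages = tool.check_and_update_param_values( params, trans )
    #     for param_name, message in messages.iteritems():
    #         log.warning( "%s: %s", param_name, message )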
1232       
1233    def check_and_update_param_values_helper( self, inputs, values, trans, messages, context=None, prefix="" ):
1234        """
1235        Recursive helper for `check_and_update_param_values`
1236        """
1237        context = ExpressionContext( values, context )
1238        for input in inputs.itervalues():
1239            # No value, insert the default
1240            if input.name not in values:
1241                messages[ input.name ] = "No value found for '%s%s', used default" % ( prefix, input.label )
1242                values[ input.name ] = input.get_initial_value( trans, context )
1243            # Value, visit recursively as usual
1244            else:
1245                if isinstance( input, Repeat ):
1246                    for i, d in enumerate( values[ input.name ] ):
1247                        rep_prefix = prefix + "%s %d > " % ( input.title, i + 1 )
1248                        self.check_and_update_param_values_helper( input.inputs, d, trans, messages, context, rep_prefix )
1249                elif isinstance( input, Conditional ):
1250                    group_values = values[ input.name ]
1251                    if input.test_param.name not in group_values:
1252                        # No test param invalidates the whole conditional
1253                        values[ input.name ] = group_values = input.get_initial_value( trans, context )
1254                        messages[ input.test_param.name ] = "No value found for '%s%s', used default" % ( prefix, input.test_param.label )
1255                        current_case = group_values['__current_case__']
1256                        for child_input in input.cases[current_case].inputs.itervalues():
1257                            messages[ child_input.name ] = "Value no longer valid for '%s%s', replaced with default" % ( prefix, child_input.label )                   
1258                    else:
1259                        current = group_values["__current_case__"]                   
1260                        self.check_and_update_param_values_helper( input.cases[current].inputs, group_values, trans, messages, context, prefix )
1261                else:
1262                    # Regular tool parameter, no recursion needed
1263                    pass       
1264   
1265    def handle_unvalidated_param_values( self, input_values, app ):
1266        """
1267        Find any instances of `UnvalidatedValue` within input_values and
1268        validate them (by calling `ToolParameter.from_html` and
1269        `ToolParameter.validate`).
1270        """
1271        # No validation is done when check_values is False
1272        if not self.check_values:
1273            return
1274        self.handle_unvalidated_param_values_helper( self.inputs, input_values, app )
1275
1276    def handle_unvalidated_param_values_helper( self, inputs, input_values, app, context=None, prefix="" ):
1277        """
1278        Recursive helper for `handle_unvalidated_param_values`
1279        """
1280        context = ExpressionContext( input_values, context )
1281        for input in inputs.itervalues():
1282            if isinstance( input, Repeat ): 
1283                for i, d in enumerate( input_values[ input.name ] ):
1284                    rep_prefix = prefix + "%s %d > " % ( input.title, i + 1 )
1285                    self.handle_unvalidated_param_values_helper( input.inputs, d, app, context, rep_prefix )
1286            elif isinstance( input, Conditional ):
1287                values = input_values[ input.name ]
1288                current = values["__current_case__"]
1289                # NOTE: The test param doesn't need to be checked since
1290                #       there would be no way to tell what case to use at
1291                #       workflow build time. However, it is not clear that
1292                #       we actually prevent such a case explicitly.
1293                self.handle_unvalidated_param_values_helper( input.cases[current].inputs, values, app, context, prefix )
1294            else:
1295                # Regular tool parameter
1296                value = input_values[ input.name ]
1297                if isinstance( value, UnvalidatedValue ):
1298                    try:
1299                        # Convert from html representation
1300                        if value.value is None:
1301                            # If value.value is None, it could not have been
1302                            # submitted via html form and therefore .from_html
1303                            # can't be guaranteed to work
1304                            value = None
1305                        else:
1306                            value = input.from_html( value.value, None, context )
1307                        # Do any further validation on the value
1308                        input.validate( value, None )
1309                    except Exception, e:
1310                        # Wrap and re-raise any generated error so we can
1311                        # generate a more informative message
1312                        v = input.value_to_display_text( value, self.app )
1313                        message = "Failed runtime validation of %s%s (value: %s) (%s)" \
1314                            % ( prefix, input.label, v, e )
1315                        raise LateValidationError( message )
1316                    input_values[ input.name ] = value
1317   
1318    def handle_job_failure_exception( self, e ):
1319        """
1320        Called by job.fail when an exception is generated to allow generation
1321        of a better error message (returning None yields the default behavior)
1322        """
1323        message = None
1324        # If the exception was generated by late validation, use its error
1325        # message (contains the parameter name and value)
1326        if isinstance( e, LateValidationError ):
1327            message = e.message
1328        return message
1329   
1330    def build_param_dict( self, incoming, input_datasets, output_datasets, output_paths, job_working_directory ):
1331        """
1332        Build the dictionary of parameters for substituting into the command
1333        line. Each value is wrapped in a `InputValueWrapper`, which allows
1334        all the attributes of the value to be used in the template, *but*
1335        when the __str__ method is called it actually calls the
1336        `to_param_dict_value` method of the associated input.
1337        """
1338        param_dict = dict()
1339        # All parameters go into the param_dict
1340        param_dict.update( incoming )
1341        # Wrap parameters as necessary
1342        def wrap_values( inputs, input_values ):
1343            for input in inputs.itervalues():
1344                if isinstance( input, Repeat ): 
1345                    for d in input_values[ input.name ]:
1346                        wrap_values( input.inputs, d )
1347                elif isinstance( input, Conditional ):
1348                    values = input_values[ input.name ]
1349                    current = values["__current_case__"]
1350                    wrap_values( input.cases[current].inputs, values )
1351                elif isinstance( input, DataToolParameter ):
1352                    ## FIXME: We're populating param_dict with conversions when
1353                    ##        wrapping values, this should happen as a separate
1354                    ##        step before wrapping (or call this wrapping step
1355                    ##        something more generic) (but iterating this same
1356                    ##        list twice would be wasteful)
1357                    # Add explicit conversions by name to current parent
1358                    for conversion_name, conversion_extensions, conversion_datatypes in input.conversions:
1359                        # If we are at building cmdline step, then converters
1360                        # have already executed
1361                        conv_ext, converted_dataset = input_values[ input.name ].find_conversion_destination( conversion_datatypes )
1362                        # When dealing with optional inputs, we'll provide a
1363                        # valid extension to be used for None converted dataset
1364                        if not conv_ext:
1365                            conv_ext = conversion_extensions[0]
1366                        # input_values[ input.name ] is None when optional
1367                        # dataset, 'conversion' of optional dataset should
1368                        # create wrapper around NoneDataset for converter output
1369                        if input_values[ input.name ] and not converted_dataset:
1370                            # Input that converter is based from has a value,
1371                            # but converted dataset does not exist
1372                            raise Exception( 'A path for explicit datatype conversion has not been found: %s --/--> %s'
1373                                % ( input_values[ input.name ].extension, conversion_extensions ) )
1374                        else:
1375                            # Trick wrapper into using target conv ext (when
1376                            # None) without actually being a tool parameter
1377                            input_values[ conversion_name ] = \
1378                                DatasetFilenameWrapper( converted_dataset,
1379                                                        datatypes_registry = self.app.datatypes_registry,
1380                                                        tool = Bunch( conversion_name = Bunch( extensions = conv_ext ) ),
1381                                                        name = conversion_name )
1382                    # Wrap actual input dataset
1383                    input_values[ input.name ] = \
1384                        DatasetFilenameWrapper( input_values[ input.name ],
1385                                                datatypes_registry = self.app.datatypes_registry,
1386                                                tool = self,
1387                                                name = input.name )
1388                elif isinstance( input, SelectToolParameter ):
1389                    input_values[ input.name ] = SelectToolParameterWrapper(
1390                        input, input_values[ input.name ], self.app, other_values = param_dict )
1391                else:
1392                    input_values[ input.name ] = InputValueWrapper(
1393                        input, input_values[ input.name ], param_dict )
1394        # HACK: only wrap if check_values is not false, this deals with external
1395        #       tools where the inputs don't even get passed through. These
1396        #       tools (e.g. UCSC) should really be handled in a special way.
1397        if self.check_values:
1398            wrap_values( self.inputs, param_dict )
1399        ## FIXME: when self.check_values==True, input datasets are being wrapped
1400        ##        twice (above and below, creating 2 separate
1401        ##        DatasetFilenameWrapper objects - first is overwritten by
1402        ##        second), is this necessary? - if we get rid of this way to
1403        ##        access children, can we stop this redundancy, or is there
1404        ##        another reason for this?
1405        ## - Only necessary when self.check_values is False (==external dataset
1406        ##   tool?: can this be abstracted out as part of being a datasource tool?)
1407        ## - But we still want (ALWAYS) to wrap input datasets (this should be
1408        ##   checked to prevent overhead of creating a new object?)
1409        # Additionally, datasets go in the param dict. We wrap them such that
1410        # if the bare variable name is used it returns the filename (for
1411        # backwards compatibility). We also add any child datasets to the
1412        # param dict encoded as:
1413        #   "_CHILD___{dataset_name}___{child_designation}",
1414        # but this should be considered DEPRECATED, instead use:
1415        #   $dataset.get_child( 'name' ).filename
1416        for name, data in input_datasets.items():
1417            param_dict[name] = DatasetFilenameWrapper( data,
1418                                                       datatypes_registry = self.app.datatypes_registry,
1419                                                       tool = self,
1420                                                       name = name )
1421            if data:
1422                for child in data.children:
1423                    param_dict[ "_CHILD___%s___%s" % ( name, child.designation ) ] = DatasetFilenameWrapper( child )
1424        for name, hda in output_datasets.items():
1425            # Write outputs to the working directory (for security purposes)
1426            # if desired.
1427            if self.app.config.outputs_to_working_directory:
1428                try:
1429                    false_path = [ dp.false_path for dp in output_paths if dp.real_path == hda.file_name ][0]
1430                    param_dict[name] = DatasetFilenameWrapper( hda, false_path = false_path )
1431                    open( false_path, 'w' ).close()
1432                except IndexError:
1433                    log.warning( "Unable to determine alternate path for writing job outputs, outputs will be written to their real paths" )
1434                    param_dict[name] = DatasetFilenameWrapper( hda )
1435            else:
1436                param_dict[name] = DatasetFilenameWrapper( hda )
1437            # Provide access to a path to store additional files
1438            # TODO: path munging for cluster/dataset server relocatability
1439            param_dict[name].files_path = os.path.abspath(os.path.join( job_working_directory, "dataset_%s_files" % (hda.dataset.id) ))
1440            for child in hda.children:
1441                param_dict[ "_CHILD___%s___%s" % ( name, child.designation ) ] = DatasetFilenameWrapper( child )
1442        for out_name, output in self.outputs.iteritems():
1443            if out_name not in param_dict and output.filters:
1444                # Assume the reason we lack this output is because a filter
1445                # failed to pass; for tool writing convenience, provide a
1446                # NoneDataset
1447                param_dict[ out_name ] = NoneDataset( datatypes_registry = self.app.datatypes_registry, ext = output.format )
1448        # We add access to app here, this allows access to app.config, etc
1449        param_dict['__app__'] = RawObjectWrapper( self.app )
1450        # More convenient access to app.config.new_file_path; we don't need to
1451        # wrap a string, but this method of generating additional datasets
1452        # should be considered DEPRECATED
1453        # TODO: path munging for cluster/dataset server relocatability
1454        param_dict['__new_file_path__'] = os.path.abspath(self.app.config.new_file_path)
1455        # The following points to location (xxx.loc) files which are pointers
1456        # to locally cached data
1457        param_dict['GALAXY_DATA_INDEX_DIR'] = self.app.config.tool_data_path
1458        # For the upload tool, we need to know the root directory and the
1459        # datatypes conf path, so we can load the datatypes registry
1460        param_dict['GALAXY_ROOT_DIR'] = os.path.abspath( self.app.config.root )
1461        param_dict['GALAXY_DATATYPES_CONF_FILE'] = os.path.abspath( self.app.config.datatypes_config )
1462        # Return the dictionary of parameters
1463        return param_dict
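    # For illustration (tool and parameter names assumed): given the
    # param_dict built above, a Cheetah command template can reference
    #
    #     my_tool.py --in $input1 --ext ${input1.ext} --out $output1
    #
    # where $input1 / $output1 stringify to file paths via
    # DatasetFilenameWrapper and plain parameters via InputValueWrapper.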
1464   
1465    def build_param_file( self, param_dict, directory=None ):
1466        """
1467        Build temporary file for file based parameter transfer if needed
1468        """
1469        if self.command and "$param_file" in self.command:
1470            fd, param_filename = tempfile.mkstemp( dir=directory )
1471            os.close( fd )
1472            f = open( param_filename, "wt" )
1473            for key, value in param_dict.items():
1474                # parameters can be strings or lists of strings, coerce to list
1475                if not isinstance( value, list ):
1476                    value = [ value ]
1477                for elem in value:
1478                    f.write( '%s=%s\n' % (key, elem) )
1479            f.close()
1480            param_dict['param_file'] = param_filename
1481            return param_filename
1482        else:
1483            return None
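    # The generated $param_file is a flat key=value listing, one line per
    # value (list values are flattened). A hypothetical example:
    #
    #     input1=/galaxy/files/000/dataset_12.dat
    #     threshold=5
    #     output1=/galaxy/files/000/dataset_13.dat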
1484           
1485    def build_config_files( self, param_dict, directory=None ):
1486        """
1487        Build temporary config files from the tool's <configfile> templates, if any
1488        """
1489        config_filenames = []
1490        for name, filename, template_text in self.config_files:
1491            # If a particular filename was forced by the config use it
1492            if filename is not None:
1493                if directory is None:
1494                    raise Exception( "Config files with fixed filenames require a working directory" )
1495                config_filename = os.path.join( directory, filename )
1496            else:
1497                fd, config_filename = tempfile.mkstemp( dir=directory )
1498                os.close( fd )
1499            f = open( config_filename, "wt" )
1500            f.write( fill_template( template_text, context=param_dict ) )
1501            f.close()
1502            param_dict[name] = config_filename
1503            config_filenames.append( config_filename )
1504        return config_filenames
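    # Sketch (the tool XML below is an assumed example, not from this module):
    #
    #     <configfiles>
    #         <configfile name="script">threshold: $threshold</configfile>
    #     </configfiles>
    #
    # produces a temp file whose path becomes $script in the command template,
    # with $threshold already substituted from param_dict.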
1505       
1506    def build_command_line( self, param_dict ):
1507        """
1508        Build command line to invoke this tool given a populated param_dict
1509        """
1510        command_line = None
1511        if not self.command:
1512            return
1513        try:               
1514            # Substituting parameters into the command
1515            command_line = fill_template( self.command, context=param_dict )
1516            # Remove newlines from command line
1517            command_line = command_line.replace( "\n", " " ).replace( "\r", " " )
1518        except Exception, e:
1519            # Make the exception message clearer before re-raising
1520            e.args = ( 'Error substituting into command line. Params: %r, Command: %s' % ( param_dict, self.command ), )
1521            raise
1522        return command_line
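    # For example (assumed values): with self.command set to
    # "my_tool.py $input1 $threshold > $output1" and a populated param_dict,
    # fill_template yields something like
    #
    #     my_tool.py /galaxy/files/000/dataset_12.dat 5 > /galaxy/files/000/dataset_13.dat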
1523
1524    def build_dependency_shell_commands( self ):
1525        """
1526        Return a list of commands to be run to populate the current
1527        environment to include this tool's requirements.
1528        """
1529        commands = []
1530        for requirement in self.requirements:
1531            # TODO: currently only supporting requirements of type package,
1532            #       need to implement some mechanism for mapping other types
1533            #       back to packages
1534            log.debug( "Dependency %s", requirement.name )
1535            if requirement.type == 'package':
1536                script_file, base_path, version = self.app.toolbox.dependency_manager.find_dep( requirement.name, requirement.version )
1537                if script_file is None:
1538                    log.warn( "Failed to resolve dependency on '%s', ignoring", requirement.name )
1539                else:
1540                    commands.append( 'PACKAGE_BASE=%s source %s' % ( base_path, script_file ) )
1541        return commands
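    # Each resolved requirement contributes one shell fragment; a hypothetical
    # package "samtools" might yield
    #
    #     PACKAGE_BASE=/deps/samtools/0.1.12 source /deps/samtools/0.1.12/env.sh
    #
    # which callers can prepend to the job's command line.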
1542
1543    def build_redirect_url_params( self, param_dict ):
1544        """
1545        Substitute parameter values into self.redirect_url_params
1546        """
1547        if not self.redirect_url_params:
1548            return
1550        # Substituting parameter values into the url params
1551        redirect_url_params = fill_template( self.redirect_url_params, context=param_dict )
1552        # Remove newlines
1553        redirect_url_params = redirect_url_params.replace( "\n", " " ).replace( "\r", " " )
1554        return redirect_url_params
1555
1556    def parse_redirect_url( self, data, param_dict ):
1557        """
1558        Parse the REDIRECT_URL tool param. Tools that send data to an external
1559        application via a redirect must include the following 3 tool params:
1560       
1561        1) REDIRECT_URL - the url to which the data is being sent
1562       
1563        2) DATA_URL - the url to which the receiving application will send an
1564           http post to retrieve the Galaxy data
1565       
1566        3) GALAXY_URL - the url to which the external application may post
1567           data as a response
1568        """
1569        redirect_url = param_dict.get( 'REDIRECT_URL' )
1570        redirect_url_params = self.build_redirect_url_params( param_dict )
1571        # Add the parameters to the redirect url.  We're splitting the param
1572        # string on '**^**' because the self.parse() method replaced white
1573        # space with that separator.
1574        params = redirect_url_params.split( '**^**' )
1575        rup_dict = {}
1576        for param in params:
            # Split only on the first '=' so values may themselves contain '='
1577            p_list = param.split( '=', 1 )
1578            p_name = p_list[0]
1579            p_val = p_list[1]
1580            rup_dict[ p_name ] = p_val
1581        DATA_URL = param_dict.get( 'DATA_URL', None )
1582        assert DATA_URL is not None, "DATA_URL parameter missing in tool config."
1583        DATA_URL += "/%s/display" % str( data.id )
1584        redirect_url += "?DATA_URL=%s" % DATA_URL
1585        # Add the redirect_url_params to redirect_url
1586        for p_name in rup_dict:
1587            redirect_url += "&%s=%s" % ( p_name, rup_dict[ p_name ] )
1588        # Add the current user email to redirect_url
1589        if data.history.user:
1590            USERNAME = str( data.history.user.email )
1591        else:
1592            USERNAME = 'Anonymous'
1593        redirect_url += "&USERNAME=%s" % USERNAME
1594        return redirect_url
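    # A hypothetical result, assuming redirect_url_params of
    # "tool_id=maf_to_bed**^**status=queued" and a DATA_URL param of
    # "http://galaxy.example.org/datasets":
    #
    #     <REDIRECT_URL>?DATA_URL=http://galaxy.example.org/datasets/42/display&tool_id=maf_to_bed&status=queued&USERNAME=user@example.org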
1595
1596    def call_hook( self, hook_name, *args, **kwargs ):
1597        """
1598        Call the custom code hook function identified by 'hook_name' if any,
1599        and return the results
1600        """
1601        try:
1602            code = self.get_hook( hook_name )
1603            if code:
1604                return code( *args, **kwargs )
1605        except Exception, e:
1606            e.args = ( "Error in '%s' hook '%s', original message: %s" % ( self.name, hook_name, e.args[0] ), )
1607            raise
1608
1609    def exec_before_job( self, app, inp_data, out_data, param_dict={} ):
1610        pass
1611
1612    def exec_after_process( self, app, inp_data, out_data, param_dict, job = None ):
1613        pass
1614
1615    def job_failed( self, job_wrapper, message, exception = False ):
1616        """
1617        Called when a job has failed
1618        """
1619        pass
1620
1621    def collect_associated_files( self, output, job_working_directory ):
1622        """
1623        Find extra files in the job working directory and move them into
1624        the appropriate dataset's files directory
1625        """
1626        for name, hda in output.items():
1627            temp_file_path = os.path.join( job_working_directory, "dataset_%s_files" % ( hda.dataset.id ) )
1628            try:
1629                if len( os.listdir( temp_file_path ) ) > 0:
1630                    store_file_path = os.path.join(
1631                        os.path.join( self.app.config.file_path, *directory_hash_id( hda.dataset.id ) ),
1632                        "dataset_%d_files" % hda.dataset.id )
1633                    shutil.move( temp_file_path, store_file_path )
1634                    # Fix permissions
1635                    for basedir, dirs, files in os.walk( store_file_path ):
1636                        util.umask_fix_perms( basedir, self.app.config.umask, 0777, self.app.config.gid )
1637                        for file in files:
1638                            path = os.path.join( basedir, file )
1639                            # Ignore symlinks
1640                            if os.path.islink( path ):
1641                                continue
1642                            util.umask_fix_perms( path, self.app.config.umask, 0666, self.app.config.gid )
1643            except:
                # No extra-files directory was created for this dataset
                # (os.listdir raised), so there is nothing to move; skip it.
1644                continue
1645   
1646    def collect_child_datasets( self, output):
1647        """
1648        Look for child dataset files, create HDA and attach to parent.
1649        """
1650        children = {}
1651        # Loop through output file names, looking for generated children in
1652        # form of 'child_parentId_designation_visibility_extension'
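        # A hypothetical matching filename for an output dataset with id 42:
        #     child_42_reverse_visible_fasta
        # (designation "reverse", shown in the history, extension "fasta")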
1653        for name, outdata in output.items():
1654            for filename in glob.glob(os.path.join(self.app.config.new_file_path,"child_%i_*" % outdata.id) ):
1655                if name not in children:
1656                    children[name] = {}
1657                fields = os.path.basename(filename).split("_")
1658                fields.pop(0)
1659                parent_id = int(fields.pop(0))
1660                designation = fields.pop(0)
1661                visible = ( fields.pop(0).lower() == "visible" )
1664                ext = fields.pop(0).lower()
1665                child_dataset = self.app.model.HistoryDatasetAssociation( extension=ext,
1666                                                                          parent_id=outdata.id,
1667                                                                          designation=designation,
1668                                                                          visible=visible,
1669                                                                          dbkey=outdata.dbkey,
1670                                                                          create_dataset=True,
1671                                                                          sa_session=self.sa_session )
1672                self.app.security_agent.copy_dataset_permissions( outdata.dataset, child_dataset.dataset )
1673                # Move data from temp location to dataset location
1674                shutil.move( filename, child_dataset.file_name )
1675                self.sa_session.add( child_dataset )
1676                self.sa_session.flush()
1677                child_dataset.set_size()
1678                child_dataset.name = "Secondary Dataset (%s)" % ( designation )
1679                child_dataset.init_meta()
1680                child_dataset.set_meta()
1681                child_dataset.set_peek()
1682                # Associate new dataset with job
1683                job = None
1684                for assoc in outdata.creating_job_associations:
1685                    job = assoc.job
1686                    break   
1687                if job:
1688                    assoc = self.app.model.JobToOutputDatasetAssociation( '__new_child_file_%s|%s__' % ( name, designation ), child_dataset )
1689                    assoc.job = job
1690                    self.sa_session.add( assoc )
1691                    self.sa_session.flush()
1692                child_dataset.state = outdata.state
1693                self.sa_session.add( child_dataset )
1694                self.sa_session.flush()
1695                # Add child to return dict
1696                children[name][designation] = child_dataset
1697                # Need to update all associated output hdas, i.e. history was
1698                # shared with job running
1699                for dataset in outdata.dataset.history_associations:
1700                    if outdata == dataset: continue
1701                    # Create new child dataset
1702                    child_data = child_dataset.copy( parent_id = dataset.id )
1703                    self.sa_session.add( child_data )
1704                    self.sa_session.flush()
1705        return children
1706       
1707    def collect_primary_datasets( self, output):
1708        """
1709        Find any additional datasets generated by a tool and attach (for
1710        cases where number of outputs is not known in advance).
1711        """
1712        primary_datasets = {}
1713        # Loop through output file names, looking for generated primary
1714        # datasets in form of:
1715        #     'primary_associatedWithDatasetID_designation_visibility_extension(_DBKEY)'
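        # A hypothetical matching filename for an output dataset with id 42:
        #     primary_42_reads2_visible_fastqsanger_hg18
        # (designation "reads2", visible, extension "fastqsanger", dbkey "hg18")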
1716        for name, outdata in output.items():
1717            for filename in glob.glob(os.path.join(self.app.config.new_file_path,"primary_%i_*" % outdata.id) ):
1718                if name not in primary_datasets:
1719                    primary_datasets[name] = {}
1720                fields = os.path.basename(filename).split("_")
1721                fields.pop(0)
1722                parent_id = int(fields.pop(0))
1723                designation = fields.pop(0)
1724                visible = ( fields.pop(0).lower() == "visible" )
1727                ext = fields.pop(0).lower()
1728                dbkey = outdata.dbkey
1729                if fields:
1730                    dbkey = fields[ 0 ]
1731                # Create new primary dataset
1732                primary_data = self.app.model.HistoryDatasetAssociation( extension=ext,
1733                                                                         designation=designation,
1734                                                                         visible=visible,
1735                                                                         dbkey=dbkey,
1736                                                                         create_dataset=True,
1737                                                                         sa_session=self.sa_session )
1738                self.app.security_agent.copy_dataset_permissions( outdata.dataset, primary_data.dataset )
1739                self.sa_session.add( primary_data )
1740                self.sa_session.flush()
1741                # Move data from temp location to dataset location
1742                shutil.move( filename, primary_data.file_name )
1743                primary_data.set_size()
1744                primary_data.name = outdata.name
1745                primary_data.info = outdata.info
1746                primary_data.init_meta( copy_from=outdata )
1747                primary_data.dbkey = dbkey
1748                primary_data.set_meta()
1749                primary_data.set_peek()
1750                # Associate new dataset with job
1751                job = None
1752                for assoc in outdata.creating_job_associations:
1753                    job = assoc.job
1754                    break   
1755                if job:
1756                    assoc = self.app.model.JobToOutputDatasetAssociation( '__new_primary_file_%s|%s__' % ( name, designation ), primary_data )
1757                    assoc.job = job
1758                    self.sa_session.add( assoc )
1759                    self.sa_session.flush()
1760                primary_data.state = outdata.state
1761                self.sa_session.add( primary_data )
1762                self.sa_session.flush()
1763                outdata.history.add_dataset( primary_data )
1764                # Add dataset to return dict
1765                primary_datasets[name][designation] = primary_data
1766                # Need to update all associated output hdas, i.e. history was
1767                # shared with job running
1768                for dataset in outdata.dataset.history_associations:
1769                    if outdata == dataset: continue
1770                    new_data = primary_data.copy()
1771                    dataset.history.add_dataset( new_data )
1772                    self.sa_session.add( new_data )
1773                    self.sa_session.flush()
1774        return primary_datasets
1775
1776class DataSourceTool( Tool ):
1777    """
1778    Alternate implementation of Tool for data_source tools -- those that
1779    allow the user to query and extract data from another web site.
1780    """
1781    tool_type = 'data_source'
1782   
1783    def _build_GALAXY_URL_parameter( self ):
1784        return ToolParameter.build( self, ElementTree.XML( '<param name="GALAXY_URL" type="baseurl" value="/tool_runner?tool_id=%s" />' % self.id ) )
1785   
1786    def parse_inputs( self, root ):
1787        Tool.parse_inputs( self, root )
1788        if 'GALAXY_URL' not in self.inputs:
1789            self.inputs[ 'GALAXY_URL' ] = self._build_GALAXY_URL_parameter()
1790   
1791    def exec_before_job( self, app, inp_data, out_data, param_dict={} ):
1792        # TODO: Allow for a generic way for all Tools to have output dataset
1793        #       properties be set to input parameter values as defined in a
1794        #       tool XML
1795        dbkey = param_dict.get( 'dbkey' )
1796        organism = param_dict.get( 'organism' )
1797        table = param_dict.get( 'table' )
1798        description = param_dict.get( 'description' )
1799        info = param_dict.get( 'info' )
1800        if description == 'range':
1801            description = param_dict.get( 'position', '' )
1802            if not description:
1803                description = 'unknown position'
1804        gb_landmark_region = param_dict.get( 'q' )
1805        data_type = param_dict.get( 'data_type' )
1806        items = out_data.items()
1807        for name, data in items:
1808            if organism and table and description:
1809                # This is UCSC
1810                data.name  = '%s on %s: %s (%s)' % ( data.name, organism, table, description )
1811            elif gb_landmark_region:
1812                # This is GBrowse
1813                data.name = '%s on %s' % ( data.name, gb_landmark_region )
1814            data.info = info
1815            data.dbkey = dbkey
1816            if data_type not in app.datatypes_registry.datatypes_by_extension:
1817                # Setting data_type to tabular will force the data to be sniffed in exec_after_process()
1818                data_type = 'tabular'
1819            data.change_datatype( data_type )
1820            # Store external data source's request parameters temporarily in
1821            # output file. In case the config setting for
1822            # "outputs_to_working_directory" is True, we must write to the
1823            # DatasetFilenameWrapper object in the param_dict since its
1824            # "false_path" attribute is the temporary path to the output dataset
1825            # ( until the job is run ).  However, even if the
1826            # "outputs_to_working_directory" setting is False, we can still
1827            # open the file the same way for temporarily storing the request
1828            # parameters.
1829            ## TODO: Input parameters should be jsonified and written into a
1830            ##       <configfile> and passed to data_source.py, instead of
1831            ##       writing tab separated key, value pairs to the output file
1832            out = open( str( param_dict.get( name ) ), 'w' )
1833            for key, value in param_dict.items():
1834                print >> out, '%s\t%s' % ( key, value )
1835            out.close()
1836
1837    def exec_after_process( self, app, inp_data, out_data, param_dict, job = None ):
        # Local import: the module-level imports do not bind `datatypes`,
        # which the interval/Bed checks below require
        from galaxy import datatypes
1838        name, data = out_data.items()[0]
1839        data.set_size()
1840        #TODO: these should already be set before the tool runs:
1841        if data.state == data.states.OK:
1842            data.name = param_dict.get( 'name', data.name )
1843            data.info = param_dict.get( 'info', data.name )
1844            data.dbkey = param_dict.get( 'dbkey', data.dbkey )
1845            data.extension = param_dict.get( 'data_type', data.extension )
1846        #TODO: these should be possible as part of data_source.py and external set_meta, see the upload tool:
1847        if data.extension in [ 'txt', 'tabular' ]:
1848            data_type = sniff.guess_ext( data.file_name, sniff_order=app.datatypes_registry.sniff_order, is_multi_byte=self.is_multi_byte )
1849            if data.extension != data_type:
1850                data.change_datatype( data_type )
1851        elif not isinstance( data.datatype, datatypes.interval.Bed ) and isinstance( data.datatype, datatypes.interval.Interval ):
1852            if data.missing_meta():
1853                data.change_datatype( 'tabular' )
1854        data.set_peek()
1855        self.sa_session.add( data )
1856        self.sa_session.flush()
1857
1858class AsyncDataSourceTool( DataSourceTool ):
1859    tool_type = 'data_source_async'
1860   
1861    def _build_GALAXY_URL_parameter( self ):
1862        return ToolParameter.build( self, ElementTree.XML( '<param name="GALAXY_URL" type="baseurl" value="/async/%s" />' % self.id ) )
1863
1864class DataDestinationTool( Tool ):
1865    tool_type = 'data_destination'
1866
1867class SetMetadataTool( Tool ):
1868    """
1869    Tool implementation for special tool that sets metadata on an existing
1870    dataset.
1871    """
1872    tool_type = 'set_metadata'
1873    def exec_after_process( self, app, inp_data, out_data, param_dict, job = None ):
        # Local import: binds `galaxy` so the metadata wrapper below resolves
        import galaxy.datatypes.metadata
1874        for name, dataset in inp_data.iteritems():
1875            external_metadata = galaxy.datatypes.metadata.JobExternalOutputMetadataWrapper( job )
1876            if external_metadata.external_metadata_set_successfully( dataset, app.model.context ):
1877                dataset.metadata.from_JSON_dict( external_metadata.get_output_filenames_by_dataset( dataset, app.model.context ).filename_out )   
1878            else:
1879                dataset._state = model.Dataset.states.FAILED_METADATA
1880                self.sa_session.add( dataset )
1881                self.sa_session.flush()
1882                return
1883            # If setting external metadata has failed, how can we inform the
1884            # user? For now, we'll leave the default metadata and set the state
1885            # back to its original.
1886            dataset.datatype.after_setting_metadata( dataset )
1887            if job and job.tool_id == '1.0.0':
1888                dataset.state = param_dict.get( '__ORIGINAL_DATASET_STATE__' )
1889            else:
1890                # Revert dataset.state to fall back to dataset.dataset.state
1891                dataset._state = None
1892            # Need to reset the peek, which may rely on metadata
1893            dataset.set_peek()
1894            self.sa_session.add( dataset )
1895            self.sa_session.flush()
1896   
1897    def job_failed( self, job_wrapper, message, exception = False ):
1898        job = job_wrapper.sa_session.query( model.Job ).get( job_wrapper.job_id )
1899        if job:
1900            inp_data = {}
1901            for dataset_assoc in job.input_datasets:
1902                inp_data[dataset_assoc.name] = dataset_assoc.dataset
1903            return self.exec_after_process( job_wrapper.app, inp_data, {}, job_wrapper.get_param_dict(), job = job )
1904           
1905class ExportHistoryTool( Tool ):
1906    tool_type = 'export_history'
1907
1908# Populate tool_type to ToolClass mappings
1909tool_types = {}
1910for tool_class in [ Tool, DataDestinationTool, SetMetadataTool, DataSourceTool, AsyncDataSourceTool ]:
1911    tool_types[ tool_class.tool_type ] = tool_class
1912
1913# ---- Utility classes to be factored out -----------------------------------
1914       
1915class BadValue( object ):
1916    def __init__( self, value ):
1917        self.value = value
1918
1919class RawObjectWrapper( object ):
1920    """
1921    Wraps an object so that __str__ returns module_name:class_name.
1922    """
1923    def __init__( self, obj ):
1924        self.obj = obj
1925    def __str__( self ):
1926        return "%s:%s" % (self.obj.__module__, self.obj.__class__.__name__)
1927    def __getattr__( self, key ):
1928        return getattr( self.obj, key )
1929
1930class InputValueWrapper( object ):
1931    """
1932    Wraps an input so that __str__ gives the "param_dict" representation.
1933    """
1934    def __init__( self, input, value, other_values={} ):
1935        self.input = input
1936        self.value = value
1937        self._other_values = other_values
1938    def __str__( self ):
1939        return self.input.to_param_dict_string( self.value, self._other_values )
1940    def __getattr__( self, key ):
1941        return getattr( self.value, key )
1942
1943class SelectToolParameterWrapper( object ):
1944    """
1945    Wraps a SelectToolParameter so that __str__ returns the selected value, but all other
1946    attributes are accessible.
1947    """
1948    def __init__( self, input, value, app, other_values={} ):
1949        self.input = input
1950        self.value = value
1951        self.input.value_label = input.value_to_display_text( value, app )
1952        self._other_values = other_values
1953    def __str__( self ):
1954        return self.input.to_param_dict_string( self.value, other_values = self._other_values )
1955    def __getattr__( self, key ):
1956        return getattr( self.input, key )
1957
1958class DatasetFilenameWrapper( object ):
1959    """
1960    Wraps a dataset so that __str__ returns the filename, but all other
1961    attributes are accessible.
1962    """
1963   
1964    class MetadataWrapper:
1965        """
1966        Wraps a Metadata Collection to return MetadataParameters wrapped
1967        according to the metadata spec. Methods implemented to match behavior
1968        of a Metadata Collection.
1969        """
1970        def __init__( self, metadata ):
1971            self.metadata = metadata
1972        def __getattr__( self, name ):
1973            rval = self.metadata.get( name, None )
1974            if name in self.metadata.spec:
1975                if rval is None:
1976                    rval = self.metadata.spec[name].no_value
1977                rval = self.metadata.spec[name].param.to_string( rval )
1978                # Store this value, so we don't need to recalculate if needed
1979                # again
1980                setattr( self, name, rval )
1981            return rval
1982        def __nonzero__( self ):
1983            return self.metadata.__nonzero__()
1984        def __iter__( self ):
1985            return self.metadata.__iter__()
1986        def get( self, key, default=None ):
1987            try:
1988                return getattr( self, key )
1989            except:
1990                return default
1991        def items( self ):
1992            return iter( [ ( k, self.get( k ) ) for k, v in self.metadata.items() ] )
1993   
1994    def __init__( self, dataset, datatypes_registry = None, tool = None, name = None, false_path = None ):
1995        if not dataset:
1996            try:
1997                # TODO: allow this to work when working with grouping
1998                ext = tool.inputs[name].extensions[0]
1999            except:
2000                ext = 'data'
2001            self.dataset = NoneDataset( datatypes_registry = datatypes_registry, ext = ext )
2002        else:
2003            self.dataset = dataset
2004            self.metadata = self.MetadataWrapper( dataset.metadata )
2005        self.false_path = false_path
2006
2007    def __str__( self ):
2008        if self.false_path is not None:
2009            return self.false_path
2010        else:
2011            return self.dataset.file_name
2012
2013    def __getattr__( self, key ):
2014        if self.false_path is not None and key == 'file_name':
2015            return self.false_path
2016        else:
2017            return getattr( self.dataset, key )
2018       
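# Illustrative usage (a sketch; `hda` is an assumed HistoryDatasetAssociation):
#
#     wrapper = DatasetFilenameWrapper( hda, false_path='/jobdir/output_0.dat' )
#     str( wrapper )          # -> '/jobdir/output_0.dat' (false_path wins)
#     wrapper.metadata.dbkey  # -> metadata value rendered via its param spec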
2019def json_fix( val ):
2020    if isinstance( val, list ):
2021        return [ json_fix( v ) for v in val ]
2022    elif isinstance( val, dict ):
2023        return dict( [ ( json_fix( k ), json_fix( v ) ) for ( k, v ) in val.iteritems() ] )
2024    elif isinstance( val, unicode ):
2025        return val.encode( "utf8" )
2026    else:
2027        return val
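# Example (sketch): simplejson returns unicode strings under Python 2, so
#     json_fix( simplejson.loads( '{"a": ["b"]}' ) )
# yields { 'a': [ 'b' ] } with plain (utf8-encoded) str keys and values.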
2028   
2029def get_incoming_value( incoming, key, default ):
2030    if "__" + key + "__is_composite" in incoming:
2031        composite_keys = incoming["__" + key + "__keys"].split()
2032        value = dict()
2033        for composite_key in composite_keys:
2034            value[composite_key] = incoming[key + "_" + composite_key]
2035        return value
2036    else:
2037        return incoming.get( key, default )
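# Sketch of the composite-parameter convention this helper decodes (the field
# names are hypothetical): a form posting
#
#     __foo__is_composite = true
#     __foo__keys         = bar baz
#     foo_bar             = 1
#     foo_baz             = 2
#
# makes get_incoming_value( incoming, 'foo', None ) return {'bar': '1', 'baz': '2'}.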
2038
2039class InterruptedUpload( Exception ):
2040    pass