[2] | 1 | import os, tempfile, StringIO |
---|
| 2 | from cgi import FieldStorage |
---|
| 3 | from galaxy import datatypes, util |
---|
| 4 | from galaxy.util.odict import odict |
---|
| 5 | from galaxy.datatypes import sniff |
---|
| 6 | from galaxy.util.json import to_json_string |
---|
| 7 | from galaxy.model.orm import eagerload_all |
---|
| 8 | |
---|
| 9 | import logging |
---|
| 10 | log = logging.getLogger( __name__ ) |
---|
| 11 | |
---|
def persist_uploads( params ):
    """
    Turn any uploads in the submitted form to persisted files.

    For each upload dataset in params['files']:
      - FieldStorage file data is hard-linked into a new temp file and
        replaced by a dict of ( filename, local_filename ).
      - A dict lacking either 'filename' or 'local_filename' is rejected.
      - Non-empty 'url_paste' content is streamed to a temp file; empty
        content is normalized to None.
    Returns the (mutated) params.
    """
    if 'files' in params:
        new_files = []
        for upload_dataset in params['files']:
            f = upload_dataset['file_data']
            if isinstance( f, FieldStorage ):
                # Uploaded data must already be a real temp file on disk --
                # in-memory buffers or anonymous fds cannot be hard-linked.
                assert not isinstance( f.file, StringIO.StringIO )
                assert f.file.name != '<fdopen>'
                local_filename = util.mkstemp_ln( f.file.name, 'upload_file_data_' )
                f.file.close()
                upload_dataset['file_data'] = dict( filename = f.filename,
                                                    local_filename = local_filename )
            elif type( f ) == dict and ( 'filename' not in f or 'local_filename' not in f ):
                # BUG FIX: the original condition was
                #   type( f ) == dict and 'filename' and 'local_filename' not in f
                # where the bare string 'filename' is always truthy, so a dict
                # missing only 'filename' slipped through unvalidated.
                raise Exception( 'Uploaded file was encoded in a way not understood by Galaxy.' )
            if upload_dataset['url_paste'].strip() != '':
                upload_dataset['url_paste'], is_multi_byte = datatypes.sniff.stream_to_file( StringIO.StringIO( upload_dataset['url_paste'] ), prefix="strio_url_paste_" )
            else:
                upload_dataset['url_paste'] = None
            new_files.append( upload_dataset )
        params['files'] = new_files
    return params
---|
def handle_library_params( trans, params, folder_id, replace_dataset=None ):
    """
    Collect the library-related upload settings from the request params
    into a Bunch: destination folder, optional info template (and any
    entered field contents), selected roles and the ldda message.
    """
    # FIXME: the received params has already been parsed by util.Params() by the time it reaches here,
    # so no complex objects remain.  This is not good because it does not allow for those objects to be
    # manipulated here.  The received params should be the original kwd from the initial request.
    bunch = util.bunch.Bunch()
    bunch.replace_dataset = replace_dataset
    bunch.message = params.get( 'ldda_message', '' )
    # See if we have any template field contents
    bunch.template_field_contents = []
    template_id = params.get( 'template_id', None )
    bunch.folder = trans.sa_session.query( trans.app.model.LibraryFolder ).get( trans.security.decode_id( folder_id ) )
    # We are inheriting the folder's info_association, so we may have received inherited contents or we may have redirected
    # here after the user entered template contents ( due to errors ).
    if template_id in [ None, 'None' ]:
        bunch.template = None
    else:
        bunch.template = trans.sa_session.query( trans.app.model.FormDefinition ).get( template_id )
        for index in range( len( bunch.template.fields ) ):
            key = 'field_%i' % index
            if params.get( key, False ):
                bunch.template_field_contents.append( util.restore_text( params.get( key, '' ) ) )
    bunch.roles = []
    for role_id in util.listify( params.get( 'roles', [] ) ):
        bunch.roles.append( trans.sa_session.query( trans.app.model.Role ).get( role_id ) )
    return bunch
---|
def get_precreated_datasets( trans, params, data_obj, controller='root' ):
    """
    Get any precreated datasets (when using asynchronous uploads).
    """
    claimed = []
    ids = []
    raw_ids = params.get( 'async_datasets', None )
    if raw_ids not in ["None", "", None]:
        ids = raw_ids.split(',')
    current_user_roles = trans.get_current_user_roles()
    for dataset_id in ids:
        try:
            data = trans.sa_session.query( data_obj ).get( int( dataset_id ) )
        except:
            log.exception( 'Unable to load precreated dataset (%s) sent in upload form' % dataset_id )
            continue
        if data_obj is trans.app.model.HistoryDatasetAssociation:
            # Ownership checks: the dataset must belong to the requesting
            # (possibly anonymous) user before it can be claimed.
            if trans.user is None and trans.galaxy_session.current_history != data.history:
                log.error( 'Got a precreated dataset (%s) but it does not belong to anonymous user\'s current session (%s)' % ( data.id, trans.galaxy_session.id ) )
            elif data.history.user != trans.user:
                log.error( 'Got a precreated dataset (%s) but it does not belong to current user (%s)' % ( data.id, trans.user.id ) )
            else:
                claimed.append( data )
        elif data_obj is trans.app.model.LibraryDatasetDatasetAssociation:
            if controller == 'library' and not trans.app.security_agent.can_add_library_item( current_user_roles, data.library_dataset.folder ):
                log.error( 'Got a precreated dataset (%s) but this user (%s) is not allowed to write to it' % ( data.id, trans.user.id ) )
            else:
                claimed.append( data )
    return claimed
---|
def get_precreated_dataset( precreated_datasets, name ):
    """
    Return a dataset matching a name from the list of precreated (via async
    upload) datasets.  If there's more than one upload with the exact same
    name, we need to pop one (the first) so it isn't chosen next time.
    Returns None when no dataset matches.
    """
    # Single pass: the original built a parallel list of names, then scanned
    # it twice ( count + index ); one enumerate scan does the same job.
    for i, dataset in enumerate( precreated_datasets ):
        if dataset.name == name:
            return precreated_datasets.pop( i )
    return None
---|
def cleanup_unused_precreated_datasets( precreated_datasets ):
    """
    Mark every unclaimed precreated dataset as errored, since no file
    contents ever arrived for it.
    """
    for dataset in precreated_datasets:
        log.info( 'Cleaned up unclaimed precreated dataset (%s).' % ( dataset.id ) )
        dataset.state = dataset.states.ERROR
        dataset.info = 'No file contents were available.'
---|
| 108 | |
---|
def new_history_upload( trans, uploaded_dataset, state=None ):
    """
    Create a new HistoryDatasetAssociation in the current history for an
    uploaded dataset and apply the history's default permissions.

    trans            -- Galaxy transaction (provides model, sa_session, history)
    uploaded_dataset -- bunch with name, file_type and dbkey attributes
    state            -- optional initial dataset state; defaults to QUEUED

    Returns the flushed HistoryDatasetAssociation.
    """
    hda = trans.app.model.HistoryDatasetAssociation( name = uploaded_dataset.name,
                                                     extension = uploaded_dataset.file_type,
                                                     dbkey = uploaded_dataset.dbkey,
                                                     history = trans.history,
                                                     create_dataset = True,
                                                     sa_session = trans.sa_session )
    if state:
        hda.state = state
    else:
        hda.state = hda.states.QUEUED
    trans.sa_session.add( hda )
    # Flush so the hda (and its dataset) have ids before further wiring.
    trans.sa_session.flush()
    trans.history.add_dataset( hda, genome_build = uploaded_dataset.dbkey )
    # New datasets inherit the history's default access permissions.
    permissions = trans.app.security_agent.history_get_default_permissions( trans.history )
    trans.app.security_agent.set_all_dataset_permissions( hda.dataset, permissions )
    trans.sa_session.flush()
    return hda
---|
def new_library_upload( trans, cntrller, uploaded_dataset, library_bunch, state=None ):
    """
    Create a LibraryDatasetDatasetAssociation for an uploaded dataset,
    creating (or replacing into) a LibraryDataset and any requested
    subfolders along the way, and wiring up permissions, template contents
    and role restrictions from the library_bunch.

    Raises Exception when the user is not authorized to add datasets to
    the target folder.  Returns the new LibraryDatasetDatasetAssociation.
    """
    current_user_roles = trans.get_current_user_roles()
    if not ( ( trans.user_is_admin() and cntrller in [ 'library_admin', 'api' ] ) or trans.app.security_agent.can_add_library_item( current_user_roles, library_bunch.folder ) ):
        # This doesn't have to be pretty - the only time this should happen is if someone's being malicious.
        raise Exception( "User is not authorized to add datasets to this library." )
    folder = library_bunch.folder
    if uploaded_dataset.get( 'in_folder', False ):
        # Create subfolders if desired
        # in_folder is a relative path; walk each component, reusing an
        # existing active subfolder when the name matches.
        for name in uploaded_dataset.in_folder.split( os.path.sep ):
            trans.sa_session.refresh( folder )
            matches = filter( lambda x: x.name == name, active_folders( trans, folder ) )
            if matches:
                folder = matches[0]
            else:
                new_folder = trans.app.model.LibraryFolder( name=name, description='Automatically created by upload tool' )
                new_folder.genome_build = util.dbnames.default_value
                folder.add_folder( new_folder )
                trans.sa_session.add( new_folder )
                trans.sa_session.flush()
                # New subfolders inherit the parent folder's permissions.
                trans.app.security_agent.copy_library_permissions( folder, new_folder )
                folder = new_folder
    if library_bunch.replace_dataset:
        ld = library_bunch.replace_dataset
    else:
        ld = trans.app.model.LibraryDataset( folder=folder, name=uploaded_dataset.name )
        trans.sa_session.add( ld )
        trans.sa_session.flush()
        trans.app.security_agent.copy_library_permissions( folder, ld )
    ldda = trans.app.model.LibraryDatasetDatasetAssociation( name = uploaded_dataset.name,
                                                             extension = uploaded_dataset.file_type,
                                                             dbkey = uploaded_dataset.dbkey,
                                                             library_dataset = ld,
                                                             user = trans.user,
                                                             create_dataset = True,
                                                             sa_session = trans.sa_session )
    trans.sa_session.add( ldda )
    if state:
        ldda.state = state
    else:
        ldda.state = ldda.states.QUEUED
    ldda.message = library_bunch.message
    trans.sa_session.flush()
    # Permissions must be the same on the LibraryDatasetDatasetAssociation and the associated LibraryDataset
    trans.app.security_agent.copy_library_permissions( ld, ldda )
    if library_bunch.replace_dataset:
        # Copy the Dataset level permissions from replace_dataset to the new LibraryDatasetDatasetAssociation.dataset
        trans.app.security_agent.copy_dataset_permissions( library_bunch.replace_dataset.library_dataset_dataset_association.dataset, ldda.dataset )
    else:
        # Copy the current user's DefaultUserPermissions to the new LibraryDatasetDatasetAssociation.dataset
        trans.app.security_agent.set_all_dataset_permissions( ldda.dataset, trans.app.security_agent.user_get_default_permissions( trans.user ) )
    folder.add_library_dataset( ld, genome_build=uploaded_dataset.dbkey )
    trans.sa_session.add( folder )
    trans.sa_session.flush()
    # Point the LibraryDataset at its (now flushed, id-bearing) ldda.
    ld.library_dataset_dataset_association_id = ldda.id
    trans.sa_session.add( ld )
    trans.sa_session.flush()
    # Handle template included in the upload form, if any.  If the upload is not asynchronous ( e.g., URL paste ),
    # then the template and contents will be included in the library_bunch at this point.  If the upload is
    # asynchronous ( e.g., uploading a file ), then the template and contents will be included in the library_bunch
    # in the get_uploaded_datasets() method below.
    if library_bunch.template and library_bunch.template_field_contents:
        # Since information templates are inherited, the template fields can be displayed on the upload form.
        # If the user has added field contents, we'll need to create a new form_values and info_association
        # for the new library_dataset_dataset_association object.
        # Create a new FormValues object, using the template we previously retrieved
        form_values = trans.app.model.FormValues( library_bunch.template, library_bunch.template_field_contents )
        trans.sa_session.add( form_values )
        trans.sa_session.flush()
        # Create a new info_association between the current ldda and form_values
        # TODO: Currently info_associations at the ldda level are not inheritable to the associated LibraryDataset,
        # we need to figure out if this is optimal
        info_association = trans.app.model.LibraryDatasetDatasetInfoAssociation( ldda, library_bunch.template, form_values )
        trans.sa_session.add( info_association )
        trans.sa_session.flush()
    # If roles were selected upon upload, restrict access to the Dataset to those roles
    if library_bunch.roles:
        for role in library_bunch.roles:
            dp = trans.app.model.DatasetPermissions( trans.app.security_agent.permitted_actions.DATASET_ACCESS.action, ldda.dataset, role )
            trans.sa_session.add( dp )
            trans.sa_session.flush()
    return ldda
---|
def new_upload( trans, cntrller, uploaded_dataset, library_bunch=None, state=None ):
    """
    Dispatch an uploaded dataset to either a library or a history upload,
    depending on whether a library_bunch was supplied.
    """
    if not library_bunch:
        return new_history_upload( trans, uploaded_dataset, state )
    return new_library_upload( trans, cntrller, uploaded_dataset, library_bunch, state )
---|
def get_uploaded_datasets( trans, cntrller, params, precreated_datasets, dataset_upload_inputs, library_bunch=None ):
    """
    Resolve all datasets for an upload request.

    Each dataset_upload_input contributes its uploaded datasets; each of
    those is either matched against a precreated (async) dataset or a brand
    new HDA/LDDA is created via new_upload().  Returns the list of uploaded
    dataset bunches, each with its .data attribute set.
    """
    uploaded_datasets = []
    for dataset_upload_input in dataset_upload_inputs:
        uploaded_datasets.extend( dataset_upload_input.get_uploaded_datasets( trans, params ) )
    for uploaded_dataset in uploaded_datasets:
        # Claim a matching precreated dataset if one exists; otherwise create one.
        data = get_precreated_dataset( precreated_datasets, uploaded_dataset.name )
        if not data:
            data = new_upload( trans, cntrller, uploaded_dataset, library_bunch )
        else:
            # Precreated dataset already exists -- just sync its type/dbkey.
            data.extension = uploaded_dataset.file_type
            data.dbkey = uploaded_dataset.dbkey
            trans.sa_session.add( data )
            trans.sa_session.flush()
        if library_bunch:
            # Track the latest dbkey as the folder's genome build.
            library_bunch.folder.genome_build = uploaded_dataset.dbkey
            trans.sa_session.add( library_bunch.folder )
            # Handle template included in the upload form, if any.  If the upload is asynchronous ( e.g., file upload ),
            # then the template and contents will be included in the library_bunch at this point.  If the upload is
            # not asynchronous ( e.g., URL paste ), then the template and contents will be included in the library_bunch
            # in the new_library_upload() method above.
            if library_bunch.template and library_bunch.template_field_contents:
                # Since information templates are inherited, the template fields can be displayed on the upload form.
                # If the user has added field contents, we'll need to create a new form_values and info_association
                # for the new library_dataset_dataset_association object.
                # Create a new FormValues object, using the template we previously retrieved
                form_values = trans.app.model.FormValues( library_bunch.template, library_bunch.template_field_contents )
                trans.sa_session.add( form_values )
                trans.sa_session.flush()
                # Create a new info_association between the current ldda and form_values
                # TODO: Currently info_associations at the ldda level are not inheritable to the associated LibraryDataset,
                # we need to figure out if this is optimal
                info_association = trans.app.model.LibraryDatasetDatasetInfoAssociation( data, library_bunch.template, form_values )
                trans.sa_session.add( info_association )
                trans.sa_session.flush()
        else:
            trans.history.genome_build = uploaded_dataset.dbkey
        uploaded_dataset.data = data
    return uploaded_datasets
---|
def create_paramfile( trans, uploaded_datasets ):
    """
    Create the upload tool's JSON "param" file.

    Writes one JSON object per uploaded dataset (newline-delimited) to a
    temp file and returns its path.  Composite datasets get their metadata
    initialized here, before the job is dispatched.
    """
    json_file = tempfile.mkstemp()
    json_file_path = json_file[1]
    # Re-open the low-level fd from mkstemp as a writable file object.
    json_file = os.fdopen( json_file[0], 'w' )
    for uploaded_dataset in uploaded_datasets:
        data = uploaded_dataset.data
        if uploaded_dataset.type == 'composite':
            # we need to init metadata before the job is dispatched
            data.init_meta()
            for meta_name, meta_value in uploaded_dataset.metadata.iteritems():
                setattr( data.metadata, meta_name, meta_value )
            trans.sa_session.add( data )
            trans.sa_session.flush()
            json = dict( file_type = uploaded_dataset.file_type,
                         dataset_id = data.dataset.id,
                         dbkey = uploaded_dataset.dbkey,
                         type = uploaded_dataset.type,
                         metadata = uploaded_dataset.metadata,
                         primary_file = uploaded_dataset.primary_file,
                         composite_file_paths = uploaded_dataset.composite_files,
                         composite_files = dict( [ ( k, v.__dict__ ) for k, v in data.datatype.get_composite_files( data ).items() ] ) )
        else:
            # These attributes are optional on the uploaded_dataset bunch,
            # so fall back to safe defaults when they are missing.
            try:
                is_binary = uploaded_dataset.datatype.is_binary
            except:
                is_binary = None
            try:
                link_data_only = uploaded_dataset.link_data_only
            except:
                link_data_only = False
            json = dict( file_type = uploaded_dataset.file_type,
                         ext = uploaded_dataset.ext,
                         name = uploaded_dataset.name,
                         dataset_id = data.dataset.id,
                         dbkey = uploaded_dataset.dbkey,
                         type = uploaded_dataset.type,
                         is_binary = is_binary,
                         link_data_only = link_data_only,
                         space_to_tab = uploaded_dataset.space_to_tab,
                         path = uploaded_dataset.path )
        json_file.write( to_json_string( json ) + '\n' )
    json_file.close()
    return json_file_path
---|
def create_job( trans, params, tool, json_file_path, data_list, folder=None, return_job=False ):
    """
    Create the upload job.

    Builds a Job in the UPLOAD state, records the tool parameters and the
    paramfile path, registers each dataset in data_list as an output, then
    flips the job to NEW and queues it.  Returns an odict mapping
    'output%i' -> dataset (preceded by the job itself when return_job is
    True).
    """
    job = trans.app.model.Job()
    galaxy_session = trans.get_galaxy_session()
    if type( galaxy_session ) == trans.model.GalaxySession:
        job.session_id = galaxy_session.id
    if trans.user is not None:
        job.user_id = trans.user.id
    if folder:
        # Library uploads are tied to a folder rather than a history.
        job.library_folder_id = folder.id
    else:
        job.history_id = trans.history.id
    job.tool_id = tool.id
    job.tool_version = tool.version
    # Hold the job in the UPLOAD state until its outputs are attached below.
    job.state = job.states.UPLOAD
    trans.sa_session.add( job )
    # Flush so job.id exists for the logging and parameter wiring below.
    trans.sa_session.flush()
    log.info( 'tool %s created job id %d' % ( tool.id, job.id ) )
    trans.log_event( 'created job id %d' % job.id, tool_id=tool.id )

    for name, value in tool.params_to_strings( params, trans.app ).iteritems():
        job.add_parameter( name, value )
    job.add_parameter( 'paramfile', to_json_string( json_file_path ) )
    if folder:
        for i, dataset in enumerate( data_list ):
            job.add_output_library_dataset( 'output%i' % i, dataset )
    else:
        for i, dataset in enumerate( data_list ):
            job.add_output_dataset( 'output%i' % i, dataset )
    job.state = job.states.NEW
    trans.sa_session.add( job )
    trans.sa_session.flush()

    # Queue the job for execution
    trans.app.job_queue.put( job.id, tool )
    trans.log_event( "Added job to the job queue, id: %s" % str(job.id), tool_id=job.tool_id )
    output = odict()
    for i, v in enumerate( data_list ):
        output[ 'output%i' % i ] = v
    if return_job:
        return job, output
    else:
        return output
---|
def active_folders( trans, folder ):
    """
    Return the active (non-deleted) subfolders of folder, ordered by name,
    with their permission actions eagerly loaded.
    """
    # Stolen from galaxy.web.controllers.library_common (importing from which causes a circular issues).
    # Much faster way of retrieving all active sub-folders within a given folder than the
    # performance of the mapper.  This query also eagerloads the permissions on each folder.
    query = trans.sa_session.query( trans.app.model.LibraryFolder )
    query = query.filter_by( parent=folder, deleted=False )
    query = query.options( eagerload_all( "actions" ) )
    query = query.order_by( trans.app.model.LibraryFolder.table.c.name )
    return query.all()
---|