sequencingSourceFile_column_name	description	data_type	multi	choice	range	choice_options	range_lower	range_upper	mandatory	unique
poseidon_IDs	Poseidon_IDs (in the .janno file) the sequencing entity corresponds to, multiple entries separated by ;	String	TRUE	FALSE	FALSE				FALSE	FALSE
udg	UDG treatment applied to the library for the sequencing entity	String	FALSE	TRUE	FALSE	minus;half;plus			FALSE	FALSE
library_built	library preparation method applied for the sequencing entity (single- or double-stranded)	String	FALSE	TRUE	FALSE	ds;ss			FALSE	FALSE
sample_accession	sample accession code as used in the INSDC databases (including ENA and SRA) to identify the sequencing entity (e.g. SAMEA7050454)	String	FALSE	FALSE	FALSE				FALSE	FALSE
study_accession	study accession code as used in the INSDC databases (e.g. PRJEB39316)	String	FALSE	FALSE	FALSE				FALSE	FALSE
run_accession	run accession code as used in the INSDC databases (e.g. ERR4331996); this should be a unique identifier in a Poseidon package	String	FALSE	FALSE	FALSE				FALSE	FALSE
sample_alias	sample alias defined by the submitter in the raw sequencing data repository	String	FALSE	FALSE	FALSE				FALSE	FALSE
secondary_sample_accession	a secondary sample accession, used in the ENA database for historical reasons (e.g. ERS4811084)	String	FALSE	FALSE	FALSE				FALSE	FALSE
first_public	date (YYYY-MM-DD) the sequencing entity was first made public in the raw sequencing data repository	Date	FALSE	FALSE	FALSE				FALSE	FALSE
last_updated	date (YYYY-MM-DD) the sequencing entity was last updated in the raw sequencing data repository	Date	FALSE	FALSE	FALSE				FALSE	FALSE
instrument_model	name of the instrument used to process the sequencing entity (e.g. Illumina HiSeq 2500)	String	FALSE	FALSE	FALSE				FALSE	FALSE
library_layout	library layout of the sequencing entity (e.g. SINGLE)	String	FALSE	FALSE	FALSE				FALSE	FALSE
library_source	source of the DNA library (e.g. GENOMIC)	String	FALSE	FALSE	FALSE				FALSE	FALSE
instrument_platform	platform, brand or type of the sequencer (e.g. ILLUMINA)	String	FALSE	FALSE	FALSE				FALSE	FALSE
library_name	library identifier, i.e. the library name the submitter has entered in the raw sequencing data repository; data entries across which optical duplicates could exist should have matching library names	String	FALSE	FALSE	FALSE				FALSE	FALSE
library_strategy	strategy used to create the library for the sequencing entity (e.g. WGS)	String	FALSE	FALSE	FALSE				FALSE	FALSE
fastq_ftp	ftp links to the FASTQ files for the sequencing entity in the raw sequencing data repository (e.g. ftp.sra.ebi.ac.uk/vol1/fastq/ERR433/009/ERR4332639/ERR4332639.fastq.gz), multiple entries separated by ;	URL	TRUE	FALSE	FALSE				FALSE	FALSE
fastq_aspera	aspera links to the FASTQ files for the sequencing entity in the raw sequencing data repository (e.g. fasp.sra.ebi.ac.uk:/vol1/fastq/ERR433/009/ERR4332639/ERR4332639.fastq.gz), multiple entries separated by ;	URL	TRUE	FALSE	FALSE				FALSE	FALSE
fastq_bytes	number of bytes in the FASTQ files, multiple entries separated by ;, must be in the same order as the ftp and/or aspera links	Integer	TRUE	FALSE	TRUE		0	Inf	FALSE	FALSE
fastq_md5	md5 hashes of the FASTQ files, multiple entries separated by ;, must be in the same order as the ftp and/or aspera links	String	TRUE	FALSE	FALSE				FALSE	FALSE
read_count	number of reads in the sequencing entity	Integer	FALSE	FALSE	TRUE		0	Inf	FALSE	FALSE
submitted_ftp	URLs to the originally submitted files before they got converted to FASTQ in the INSDC databases, multiple entries separated by ;	String	TRUE	FALSE	FALSE				FALSE	FALSE