Schema

	A	B	C	D	E	F	G	H	I	J	K	L	M	N	O
1	NCBI/JSON
2	NCBI/JSON
3	attrs									datatype	sample	flatJSON	essential	description (https://api.ncbi.nlm.nih.gov/variation/v0/#/)	note
4	d1	d2	d3	d4	d5	d6	d6	d8	d9	datatype	sample	flatJSON	essential	description (https://api.ncbi.nlm.nih.gov/variation/v0/#/)	note
5	refsnp_id									str/int	"268"	refsnp_id		A 64 bit positive integer that is uniquely and forever assigned to this RefSNP object
6	create_date									timestamp	"2000-09-19T17:02Z"	create_date		The date the RefSNP was created
7	last_update_date									timestamp	"2018-10-12T12:02Z"	last_update_date		The date the RefSNP was last updated or create_date if never updated
8	last_update_build_id									str/int	"152"	last_update_build_id		The id of the last dbSNP build in which this RefSNP was created or updated
9	dbsnp1_merges									COMPLEX LIST		dbsnp1_merges		Record of one RefSNP merging into another. Due to curatorial changes or a change in input alignment data sets, a RefSNP may change anchor such that it now coincides with second RefSNP. Only one 'live' RefSNP is allowed at a given anchor. To resolve this conflict, dbSNP chooses one RefSNP as 'live', and merges the data from the other RefSNP into it. dbSNP gives preference to the clinical RefSNP and if that is not sufficient it chooses the oldest RefSNP, the one with the lowest ID.	this field is for dbsnp1 merge only. Record of each time another RefSNP objects merged into this RefSNP because the RsAnchors of each were the same. If the recipient of a merge then merges into yet a third RefSNP, the list is flattened.
10		merged_rsid								str/int	"17850737"	merged_rsid		The RefSNP ID of the RefSNP object that was merged into the now live RefSNP
11		revision								str/int	"126"	revision		The revision in which the merge took place
12		merge_date								timestamp	"2006-03-11T06:16Z"	merge_date		The date and time the RefSNP was merged
13	citations									list(int)	[8541837, 17357073]	citations		Set of PubMed IDs (PMIDs) for this RefSNP or its supporting submissions
14	lost_obs_movements									list(?)	[]	lost_obs_movements		For recording the movement of an observation that was in this RefSNP in the previous release, but no longer in the current
15	present_obs_movements									COMPLEX LIST		present_obs_movements		The record of movements between the previous and current release for observations mapped to this RefSNP by the Alignment Data Set used in this release
16		component_ids								COMPLEX LIST		component_ids		DbSnpIds of the supporting data where this particular observation is found (SubSnpId, ClinVarSnpId, etc.
17			type							str	"subsnp"	type		[ subsnp, frequency, clinvar ] - The kind of supporting data. This list can expand.
18			value							str/int	"3643680166"	value		The submitted variant ID.
19		observation								OBJECT		observation		A single contextual allele in SPDI notation. Contextual allele means that applying the Blossom Precision Correction Algorithm would leave the fields unchanged.
20			seq_id							str	"NC_000008.9"	seq_id		The RefSeq/Genbank Accession.Version for the reference sequence
21			position							int	19956017	position		The 0-based boundary position where the deletion starts. That is, position 0 starts the deletion immediately before the first nucleotide and position 1 starts the deletion between the first and second nucleotides.
22			deleted_sequence							str	"A"	deleted_sequence		The IUPAC sequence of nucleotides/amino-acids to delete from the reference. This can be empty, which is how a pure insertion is represented.
23			inserted_sequence							str	"A"	inserted_sequence		The IUPAC sequence of nucleotides/amino-acids to insert after perforing the deletion. Amino-acids use the single character encoding. All nucleotide codes including the ones for ambiguity are allowed.
24		allele_in_cur_release								OBJECT		allele_in_cur_release		-
25			seq_id							str	"NC_000008.11"	seq_id		-
26			position							int	19956017	position		-
27			deleted_sequence							str	"A"	deleted_sequence		-
28			inserted_sequence							str	"A"	inserted_sequence		-
29		other_rsids_in_cur_release								list(?)	[]	other_rsids_in_cur_release		The RSIDs of any other RefSnps that contain this observation in the current release. Can only be non-empty for the identity allele.
30		previous_release								OBJECT		previous_release		The characteristics of an observation that allow one to find it in the previous release. Should only be used when the observation described was present in the previous release.
31			allele							OBJECT		allele		A single contextual allele in SPDI notation. Contextual allele means that applying the Blossom Precision Correction Algorithm would leave the fields unchanged.
32				seq_id						str	"NC_000008.10"	seq_id		-
33				position						int	19813528	position		-
34				deleted_sequence						str	"A"	deleted_sequence		-
35				inserted_sequence						str	"A"	inserted_sequence		-
36			rsids							list(str)	["268"]	rsids		The ids of the RefSnps that contained a particular observation in the previous release. Only identity alleles can belong to more than one RefSnp, so this can only have more than one entry if the observation maps to the identity allele. The PreviousRelease struct should only be used when the observation was present in the previous release, so this field should not be empty.
37		last_added_to_this_rs								str/int	"151"	last_added_to_this_rs		The most recent release in which this observation started being associated with this RSID. If the historical membership for this observation is release1:rs1 release2:rs2 release3:rs1 release4:rs1, this will hold "release3". Note that because of a change to the dbSNP data model between builds 151 and 152, if the most recent release is prior to 152 then the observation may have been added to this RefSNP before the build listed. For example, if it says 140, it is possible that it was really added in 130. But it cannot have been added after build 140. If it says 152, then it was last added in build 152 and not before or after that.
38	primary_snapshot_data									OBJECT		primary_snapshot_data		Data specific to primary snapshots; cannot be present at the same time as merged_snapshot_data or nosnppos_snapshot_data
39		placements_with_allele								COMPLEX LIST		placements_with_allele		List of all placements, each containing a list of the alleles in the context of that reference region. Includes both nucleotide and protein placements. For all placements, the list of alleles is the same length and in the same order. They represent the alleles on the preferred top level placement (PTLP) in sorted order. So, on a given placement, the first allele is how the first allele on the PTLP appears upon mapping to the given placement. Similarly for the second allele, and so on.	For nucleotide placements, each allele in this placement is stored as a SPDI. Each SPDI contains a reference sequence identifier. For the set of alleles in SPDI syntax, they must all have the same reference sequence identifier, that matches the seq_id attribute. For protein placements, the allele is either in SPDI syntax, or gives a general description of a frameshift.
40			seq_id							str	"NC_000008.11"	seq_id		-
41			is_ptlp							bool	TRUE	is_ptlp		True if this placement is the preferred top level placement (PTLP) under the alignment data set which generated this RefSnp cluster
42			placement_annot							OBJECT		placement_annot		Annotation about this sequence
43				seq_type						str / ENUM	"refseq_chromosome"	seq_type		[ refseq_chromosome, refseq_contig, gpipe_chromosome, contig, refseq_genomic, refseq_mrna, refseq_mrna_pred, mrna, refseq_ncrna, refseq_ncrna_pred, ncrna, refseq_prot, genbank, embl, ddbj ]	The associated sequence's type
44				mol_type						str	"genomic"	mol_type		[ unknown, genomic, rna, protein, mitochondrion, nucleic_acid ]
45				seq_id_traits_by_assembly						COMPLEX LIST		seq_id_traits_by_assembly		-
46					assembly_name					str	"GRCh38.p12"	assembly_name		-
47					assembly_accession					str	"GCF_000001405.38"	assembly_accession		-
48					is_top_level					bool	TRUE	is_top_level		-
49					is_alt					bool	FALSE	is_alt		-
50					is_patch					bool	FALSE	is_patch		-
51					is_chromosome					bool	TRUE	is_chromosome		-
52				is_aln_opposite_orientation						bool	FALSE	is_aln_opposite_orientation		True if this sequence is aligned reverse to the PTLP sequence. Thus, the PTLP sequence's is_aln_opposite_orientation attribute is always false.
53				is_mismatch						bool	FALSE	is_mismatch		True if this sequence's residues are different than the PTLP sequence at this locus. Thus, the PTLP sequence's is_mismatch attribute is always false
54			alleles							COMPLEX LIST		alleles		-
55				allele						OBJECT		allele		A RefSnp can describe 1 to N alleles. While for the PTLP, all alleles (in SPDI syntax) are the same type and length, non-PTLP Placements (i.e. all other Placements), the allele in SPDI syntax may have different types, lengths and start positions, and in some rare cases, may not even overlap. But they are all on this placement's Sequence.
56					spdi					OBJECT		spdi		-
57						seq_id				str	"NC_000008.11"	seq_id		-
58						position				int	19956017	position		-
59						deleted_sequence				str	"A"	deleted_sequence		-
60						inserted_sequence str				str	"A"	inserted_sequence		-
61				hgvs						str	"NC_000008.11:g.19956018A="	hgvs		-
62		allele_annotations								COMPLEX LIST		allele_annotations		Each element holds the annotations associated with a particular variant. This list of annotation lists has the same order and length as the list of alleles in each placement. This order associates each allele with its corresponding annotation list. If an allele was not associated with any annotations, the corresponding annotation set will have only empty lists.
63			frequency							COMPLEX LIST		frequency		-
64				study_name						str	"1000Genomes"	study_name		-
65				study_version						int	1	study_version		-
66				local_row_id						int	41009890	local_row_id		-
67				observation						OBJECT		observation		-
68					seq_id					str	"NC_000008.10"	seq_id		-
69					position					int	19813528	position		-
70					deleted_sequence					str	"A"	deleted_sequence		-
71					inserted_sequence					str	"G"	inserted_sequence		-
72				allele_count						int	26	allele_count		-
73				total_count						int	5008	total_count		-
74			clinical							COMPLEX LIST		clinical		-
75				accession_version						str	"RCV000001615.2"	accession_version		-
76				allele_id						int	16589	allele_id		-
77				measure_set_id						int	1550	measure_set_id		-
78				variant_identifiers						COMPLEX LIST		variant_identifiers		-
79					organization					str	"UniProtKB"	organization		-
80					accession					str	"P06858#VAR_004239"	accession		-
81				refsnp_id						str	"268"	refsnp_id		-
82				create_date						timestamp	"2012-08-13T00:00Z"	create_date		-
83				update_date						timestamp	"2018-07-21T00:00Z"	update_date		-
84				last_evaluated_date						timestamp	"2017-12-3T00:00Z"	last_evaluated_date		-
85				review_status						str	"criteria_provided_single_submitter"	review_status		-
86				disease_names						list(str)	["Hyperapobetalipoproteinemia"]	disease_names		-
87				clinical_significances						list(str)	["pathogenic"]	clinical_significances		-
88				disease_ids						COMPLEX LIST		disease_ids		-
89					organization					str	"GeneReviews"	organization		-
90					accession					str	"NBK208534"	accession		-
91				origins						list(str)	["germline","inherited"]	origins		-
92				collection_method						list(str)	["clinical-testing", "literature-only"]	collection_method		-
93				citations						list(int)	[8541837]	citations		-
94				gene_ids						list(str)	["4023"]	gene_ids		-
95			submissions							list(str)	["268", "23712753", "28505039"]	submissions		-
96			assembly_annotation							COMPLEX LIST		assembly_annotation		-
97				seq_id						str	"NC_000008.11"	seq_id		-
98				annotation_release						str	"Homo sapiens Annotation Release 109"	annotation_release		-
99				genes						COMPLEX LIST		genes		-
100					name					str	"lipoprotein lipase"	name		-