File: good_repertoire.yaml

package info (click to toggle)
python-airr 1.5.1-2
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 684 kB
  • sloc: python: 2,407; sh: 19; makefile: 10
file content (379 lines) | stat: -rw-r--r-- 15,221 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
#
# Example metadata
#

Repertoire:
  - repertoire_id: 1841923116114776551-242ac11c-0001-012
    study:
      study_id: PRJNA300878
      study_title: "Homo sapiens B and T cell repertoire - MZ twins"
      study_type:
        id: null
        label: null
      study_description: "The adaptive immune system's capability to protect the body requires a highly diverse lymphocyte antigen receptor repertoire. However, the influence of individual genetic and epigenetic differences on these repertoires is not typically measured. By leveraging the unique characteristics of B, CD4+ T, and CD8+ T lymphocyte subsets isolated from monozygotic twins, we have quantified the impact of heritable factors on both the V(D)J recombination process and thymic selection in the case of T cell receptors, and show that the repertoires of both naive and antigen experienced cells are subject to biases resulting from differences in recombination. We show that biases in V(D)J usage, as well as biased N/P additions, contribute to significant variation in the CDR3 region. Moreover, we show that the relative usage of V and J gene segments is chromosomally biased, with approximately 1.5 times as many rearrangements originating from a single chromosome. These data refine our understanding of the heritable mechanisms affecting the repertoire, and show that biases are evident on a chromosome-wide level."
      study_contact: "Mark M. Davis,  mmdavis@stanford.edu, ORCID:0000-0001-6868-657X"
      inclusion_exclusion_criteria: null
      lab_name: "Mark M. Davis"
      lab_address: "Stanford University"
      submitted_by: "Florian Rubelt"
      pub_ids: "PMID:27005435"
      collected_by: null
      grants: null
      keywords_study: 
        - "contains_ig"
        - "contains_tr"
    subject:
      subject_id: TW01A
      synthetic: false
      species:
        id: "NCBITaxon_9606"
        label: "Homo sapiens"
      sex: female
      age_min: 27
      age_max: 27
      age_unit:
        id: UO_0000036
        label: year
      age_event: null
      ancestry_population: null
      ethnicity: null
      race: null
      strain_name: null
      linked_subjects: TW01B
      link_type: twin
      diagnosis:
        - study_group_description: null
          disease_diagnosis:
            id: null
            label: null
          disease_length: null
          disease_stage: null
          prior_therapies: null
          immunogen: null
          intervention: null
          medical_history: null

    sample:
      - sample_id: TW01A_B_naive
        sample_processing_id: null
        sample_type: "peripheral venous puncture"
        tissue:
          id: "UBERON_0000178"
          label: "blood"
        tissue_processing: "Ficoll gradient"
        cell_subset:
          id: "CL_0000788"
          label: "naive B cell"
        cell_phenotype: "expression of CD20 and the absence of CD27"
        cell_species:
          id: "NCBITaxon_9606"
          label: "Homo sapiens"
        single_cell: false
        cell_isolation: FACS
        template_class: RNA
        pcr_target:
          - pcr_target_locus: IGH
            forward_pcr_primer_target_location: null
            reverse_pcr_primer_target_location: null
        sequencing_platform: "Illumina MiSeq"
        sequencing_files:
          sequencing_data_id: SRA:SRR2905656
          file_type: fastq
          filename: SRR2905656_R1.fastq.gz
          read_direction: forward
          read_length: 300
          paired_filename: SRR2905656_R2.fastq.gz
          paired_read_direction: reverse
          paired_read_length: 300
          index_filename: SRR2905656_R3.fastq.gz
          index_length: 8
        anatomic_site: null
        disease_state_sample: null
        collection_time_point_relative: null
        collection_time_point_relative_unit:
          id: null
          label: null
        collection_time_point_reference: null
        biomaterial_provider: null
        cell_number: null
        cells_per_reaction: null
        cell_storage: false
        cell_quality: null
        cell_processing_protocol: null
        template_quality: null
        template_amount: null
        template_amount_unit:
          id: null
          label: null
        library_generation_method: "RT(oligo-dT)+PCR"
        library_generation_protocol: null
        library_generation_kit_version: null
        complete_sequences: "partial"
        physical_linkage: "none"
        sequencing_run_id: null
        total_reads_passing_qc_filter: null
        sequencing_facility: null
        sequencing_run_date: null
        sequencing_kit: null
    data_processing:
      - data_processing_id: 3059369183532618216-242ac11b-0001-007
        primary_annotation: true
        software_versions: null
        paired_reads_assembly: null
        quality_thresholds: null
        primer_match_cutoffs: null
        collapsing_method: null
        data_processing_protocols: null
        data_processing_files: null
        germline_database: null
        analysis_provenance_id: 6623294219256599016-242ac11c-0001-012

  - repertoire_id: 1602908186092376551-242ac11c-0001-012
    study:
      study_id: PRJNA300878
      study_title: "Homo sapiens B and T cell repertoire - MZ twins"
      study_type:
        id: null
        label: null
      study_description: "The adaptive immune system's capability to protect the body requires a highly diverse lymphocyte antigen receptor repertoire. However, the influence of individual genetic and epigenetic differences on these repertoires is not typically measured. By leveraging the unique characteristics of B, CD4+ T, and CD8+ T lymphocyte subsets isolated from monozygotic twins, we have quantified the impact of heritable factors on both the V(D)J recombination process and thymic selection in the case of T cell receptors, and show that the repertoires of both naive and antigen experienced cells are subject to biases resulting from differences in recombination. We show that biases in V(D)J usage, as well as biased N/P additions, contribute to significant variation in the CDR3 region. Moreover, we show that the relative usage of V and J gene segments is chromosomally biased, with approximately 1.5 times as many rearrangements originating from a single chromosome. These data refine our understanding of the heritable mechanisms affecting the repertoire, and show that biases are evident on a chromosome-wide level."
      study_contact: "Mark M. Davis,  mmdavis@stanford.edu, ORCID:0000-0001-6868-657X"
      inclusion_exclusion_criteria: null
      lab_name: "Mark M. Davis"
      lab_address: "Stanford University"
      submitted_by: "Florian Rubelt"
      pub_ids: "PMID:27005435"
      collected_by: null
      grants: null
      keywords_study:
        - "contains_ig"
        - "contains_tr"
    subject:
      subject_id: TW01A
      synthetic: false
      species:
        id: "NCBITaxon_9606"
        label: "Homo sapiens"
      sex: female
      age_min: 27
      age_max: 27
      age_unit:
        id: UO_0000036
        label: year
      age_event: null
      ancestry_population: null
      ethnicity: null
      race: null
      strain_name: null
      linked_subjects: TW01B
      link_type: twin
      diagnosis:
        - study_group_description: null
          disease_diagnosis:
            id: null
            label: null
          disease_length: null
          disease_stage: null
          prior_therapies: null
          immunogen: null
          intervention: null
          medical_history: null

    sample:
      - sample_id: TW01A_B_memory
        sample_processing_id: null
        sample_type: "peripheral venous puncture"
        tissue:
          id: "UBERON_0000178"
          label: "blood"
        tissue_processing: "Ficoll gradient"
        cell_subset:
          id: "CL_0000787"
          label: "memory B cell"
        cell_phenotype: "expression of CD20 and CD27"
        cell_species:
          id: "NCBITaxon_9606"
          label: "Homo sapiens"
        single_cell: false
        cell_isolation: FACS
        template_class: RNA
        pcr_target:
          - pcr_target_locus: IGH
            forward_pcr_primer_target_location: null
            reverse_pcr_primer_target_location: null
        sequencing_platform: "Illumina MiSeq"
        sequencing_files:
          sequencing_data_id: SRA:SRR2905655
          file_type: fastq
          filename: SRR2905655_R1.fastq.gz
          read_direction: forward
          read_length: 300
          paired_filename: SRR2905655_R2.fastq.gz
          paired_read_direction: reverse
          paired_read_length: 300
          index_filename: SRR2905655_R3.fastq.gz
          index_length: 8
        anatomic_site: null
        disease_state_sample: null
        collection_time_point_relative: null
        collection_time_point_relative_unit:
          id: null
          label: null
        collection_time_point_reference: null
        biomaterial_provider: null
        cell_number: null
        cells_per_reaction: null
        cell_storage: false
        cell_quality: null
        cell_processing_protocol: null
        template_quality: null
        template_amount: null
        template_amount_unit:
          id: null
          label: null
        library_generation_method: "RT(oligo-dT)+PCR"
        library_generation_protocol: null
        library_generation_kit_version: null
        complete_sequences: "partial"
        physical_linkage: "none"
        sequencing_run_id: null
        total_reads_passing_qc_filter: null
        sequencing_facility: null
        sequencing_run_date: null
        sequencing_kit: null
    data_processing:
      - data_processing_id: 3059369183532618216-242ac11b-0001-007
        primary_annotation: true
        software_versions: null
        paired_reads_assembly: null
        quality_thresholds: null
        primer_match_cutoffs: null
        collapsing_method: null
        data_processing_protocols: null
        data_processing_files: null
        germline_database: null
        analysis_provenance_id: 6623294219256599016-242ac11c-0001-012

  - repertoire_id: 2366080924918616551-242ac11c-0001-012
    study:
      study_id: PRJNA300878
      study_title: "Homo sapiens B and T cell repertoire - MZ twins"
      study_type:
        id: null
        label: null
      study_description: "The adaptive immune system's capability to protect the body requires a highly diverse lymphocyte antigen receptor repertoire. However, the influence of individual genetic and epigenetic differences on these repertoires is not typically measured. By leveraging the unique characteristics of B, CD4+ T, and CD8+ T lymphocyte subsets isolated from monozygotic twins, we have quantified the impact of heritable factors on both the V(D)J recombination process and thymic selection in the case of T cell receptors, and show that the repertoires of both naive and antigen experienced cells are subject to biases resulting from differences in recombination. We show that biases in V(D)J usage, as well as biased N/P additions, contribute to significant variation in the CDR3 region. Moreover, we show that the relative usage of V and J gene segments is chromosomally biased, with approximately 1.5 times as many rearrangements originating from a single chromosome. These data refine our understanding of the heritable mechanisms affecting the repertoire, and show that biases are evident on a chromosome-wide level."
      study_contact: "Mark M. Davis,  mmdavis@stanford.edu, ORCID:0000-0001-6868-657X"
      inclusion_exclusion_criteria: null
      lab_name: "Mark M. Davis"
      lab_address: "Stanford University"
      submitted_by: "Florian Rubelt"
      pub_ids: "PMID:27005435"
      collected_by: null
      grants: null
      keywords_study:
        - "contains_ig"
        - "contains_tr"
    subject:
      subject_id: TW01A
      synthetic: false
      species:
        id: "NCBITaxon_9606"
        label: "Homo sapiens"
      sex: female
      age_min: 27
      age_max: 27
      age_unit:
        id: UO_0000036
        label: year
      age_event: null
      ancestry_population: null
      ethnicity: null
      race: null
      strain_name: null
      linked_subjects: TW01B
      link_type: twin
      diagnosis:
        - study_group_description: null
          disease_diagnosis:
            id: null
            label: null
          disease_length: null
          disease_stage: null
          prior_therapies: null
          immunogen: null
          intervention: null
          medical_history: null

    sample:
      - sample_id: TW01A_T_naive_CD4
        sample_processing_id: null
        sample_type: "peripheral venous puncture"
        tissue:
          id: "UBERON_0000178"
          label: "blood"
        tissue_processing: "Ficoll gradient"
        cell_subset:
          id: "CL_0000895"
          label: "naive thymus-derived CD4-positive, alpha-beta T cell"
        cell_phenotype: "expression of CD8 and absence of CD4 and CD45RO"
        cell_species:
          id: "NCBITaxon_9606"
          label: "Homo sapiens"
        single_cell: false
        cell_isolation: FACS
        template_class: RNA
        pcr_target:
          - pcr_target_locus: TRB
            forward_pcr_primer_target_location: null
            reverse_pcr_primer_target_location: null
        sequencing_platform: "Illumina MiSeq"
        sequencing_files:
          sequencing_data_id: SRA:SRR2905659
          file_type: fastq
          filename: SRR2905659_R1.fastq.gz
          read_direction: forward
          read_length: 300
          paired_filename: SRR2905659_R2.fastq.gz
          paired_read_direction: reverse
          paired_read_length: 300
          index_filename: SRR2905659_R3.fastq.gz
          index_length: 8
        anatomic_site: null
        disease_state_sample: null
        collection_time_point_relative: null
        collection_time_point_relative_unit:
          id: null
          label: null
        collection_time_point_reference: null
        biomaterial_provider: null
        cell_number: null
        cells_per_reaction: null
        cell_storage: false
        cell_quality: null
        cell_processing_protocol: null
        template_quality: null
        template_amount: null
        template_amount_unit:
          id: null
          label: null
        library_generation_method: "RT(oligo-dT)+PCR"
        library_generation_protocol: null
        library_generation_kit_version: null
        complete_sequences: "partial"
        physical_linkage: "none"
        sequencing_run_id: null
        total_reads_passing_qc_filter: null
        sequencing_facility: null
        sequencing_run_date: null
        sequencing_kit: null
    data_processing:
      - data_processing_id: 651223970338378216-242ac11b-0001-007
        primary_annotation: true
        software_versions: null
        paired_reads_assembly: null
        quality_thresholds: null
        primer_match_cutoffs: null
        collapsing_method: null
        data_processing_protocols: null
        data_processing_files: null
        germline_database: null
        analysis_provenance_id: 4625424004665971176-242ac11c-0001-012