// readgroup.proto

// Copyright 2016 Google Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

  14. syntax = "proto3";
  15. package google.genomics.v1;
  16. import "google/api/annotations.proto";
  17. import "google/protobuf/struct.proto";
  18. option cc_enable_arenas = true;
  19. option go_package = "google.golang.org/genproto/googleapis/genomics/v1;genomics";
  20. option java_multiple_files = true;
  21. option java_outer_classname = "ReadGroupProto";
  22. option java_package = "com.google.genomics.v1";
  23. // A read group is all the data that's processed the same way by the sequencer.
  24. message ReadGroup {
  25. message Experiment {
  26. // A client-supplied library identifier; a library is a collection of DNA
  27. // fragments which have been prepared for sequencing from a sample. This
  28. // field is important for quality control as error or bias can be introduced
  29. // during sample preparation.
  30. string library_id = 1;
  31. // The platform unit used as part of this experiment, for example
  32. // flowcell-barcode.lane for Illumina or slide for SOLiD. Corresponds to the
  33. // @RG PU field in the SAM spec.
  34. string platform_unit = 2;
  35. // The sequencing center used as part of this experiment.
  36. string sequencing_center = 3;
  37. // The instrument model used as part of this experiment. This maps to
  38. // sequencing technology in the SAM spec.
  39. string instrument_model = 4;
  40. }
  41. message Program {
  42. // The command line used to run this program.
  43. string command_line = 1;
  44. // The user specified locally unique ID of the program. Used along with
  45. // `prevProgramId` to define an ordering between programs.
  46. string id = 2;
  47. // The display name of the program. This is typically the colloquial name of
  48. // the tool used, for example 'bwa' or 'picard'.
  49. string name = 3;
  50. // The ID of the program run before this one.
  51. string prev_program_id = 4;
  52. // The version of the program run.
  53. string version = 5;
  54. }
  55. // The server-generated read group ID, unique for all read groups.
  56. // Note: This is different than the @RG ID field in the SAM spec. For that
  57. // value, see [name][google.genomics.v1.ReadGroup.name].
  58. string id = 1;
  59. // The dataset to which this read group belongs.
  60. string dataset_id = 2;
  61. // The read group name. This corresponds to the @RG ID field in the SAM spec.
  62. string name = 3;
  63. // A free-form text description of this read group.
  64. string description = 4;
  65. // A client-supplied sample identifier for the reads in this read group.
  66. string sample_id = 5;
  67. // The experiment used to generate this read group.
  68. Experiment experiment = 6;
  69. // The predicted insert size of this read group. The insert size is the length
  70. // the sequenced DNA fragment from end-to-end, not including the adapters.
  71. int32 predicted_insert_size = 7;
  72. // The programs used to generate this read group. Programs are always
  73. // identical for all read groups within a read group set. For this reason,
  74. // only the first read group in a returned set will have this field
  75. // populated.
  76. repeated Program programs = 10;
  77. // The reference set the reads in this read group are aligned to.
  78. string reference_set_id = 11;
  79. // A map of additional read group information. This must be of the form
  80. // map<string, string[]> (string key mapping to a list of string values).
  81. map<string, google.protobuf.ListValue> info = 12;
  82. }