1*d5c09012SAndroid Build Coastguard Worker// Copyright 2016 Google Inc. 2*d5c09012SAndroid Build Coastguard Worker// 3*d5c09012SAndroid Build Coastguard Worker// Licensed under the Apache License, Version 2.0 (the "License"); 4*d5c09012SAndroid Build Coastguard Worker// you may not use this file except in compliance with the License. 5*d5c09012SAndroid Build Coastguard Worker// You may obtain a copy of the License at 6*d5c09012SAndroid Build Coastguard Worker// 7*d5c09012SAndroid Build Coastguard Worker// http://www.apache.org/licenses/LICENSE-2.0 8*d5c09012SAndroid Build Coastguard Worker// 9*d5c09012SAndroid Build Coastguard Worker// Unless required by applicable law or agreed to in writing, software 10*d5c09012SAndroid Build Coastguard Worker// distributed under the License is distributed on an "AS IS" BASIS, 11*d5c09012SAndroid Build Coastguard Worker// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 12*d5c09012SAndroid Build Coastguard Worker// See the License for the specific language governing permissions and 13*d5c09012SAndroid Build Coastguard Worker// limitations under the License. 14*d5c09012SAndroid Build Coastguard Worker 15*d5c09012SAndroid Build Coastguard Workersyntax = "proto3"; 16*d5c09012SAndroid Build Coastguard Worker 17*d5c09012SAndroid Build Coastguard Workerpackage google.genomics.v1; 18*d5c09012SAndroid Build Coastguard Worker 19*d5c09012SAndroid Build Coastguard Workerimport "google/api/annotations.proto"; 20*d5c09012SAndroid Build Coastguard Worker 21*d5c09012SAndroid Build Coastguard Workeroption cc_enable_arenas = true; 22*d5c09012SAndroid Build Coastguard Workeroption go_package = "google.golang.org/genproto/googleapis/genomics/v1;genomics"; 23*d5c09012SAndroid Build Coastguard Workeroption java_multiple_files = true; 24*d5c09012SAndroid Build Coastguard Workeroption java_outer_classname = "CigarProto"; 25*d5c09012SAndroid Build Coastguard Workeroption java_package = "com.google.genomics.v1"; 26*d5c09012SAndroid Build Coastguard Worker 27*d5c09012SAndroid Build Coastguard Worker// A single CIGAR operation. 28*d5c09012SAndroid Build Coastguard Workermessage CigarUnit { 29*d5c09012SAndroid Build Coastguard Worker // Describes the different types of CIGAR alignment operations that exist. 30*d5c09012SAndroid Build Coastguard Worker // Used wherever CIGAR alignments are used. 31*d5c09012SAndroid Build Coastguard Worker enum Operation { 32*d5c09012SAndroid Build Coastguard Worker OPERATION_UNSPECIFIED = 0; 33*d5c09012SAndroid Build Coastguard Worker 34*d5c09012SAndroid Build Coastguard Worker // An alignment match indicates that a sequence can be aligned to the 35*d5c09012SAndroid Build Coastguard Worker // reference without evidence of an INDEL. Unlike the 36*d5c09012SAndroid Build Coastguard Worker // `SEQUENCE_MATCH` and `SEQUENCE_MISMATCH` operators, 37*d5c09012SAndroid Build Coastguard Worker // the `ALIGNMENT_MATCH` operator does not indicate whether the 38*d5c09012SAndroid Build Coastguard Worker // reference and read sequences are an exact match. This operator is 39*d5c09012SAndroid Build Coastguard Worker // equivalent to SAM's `M`. 40*d5c09012SAndroid Build Coastguard Worker ALIGNMENT_MATCH = 1; 41*d5c09012SAndroid Build Coastguard Worker 42*d5c09012SAndroid Build Coastguard Worker // The insert operator indicates that the read contains evidence of bases 43*d5c09012SAndroid Build Coastguard Worker // being inserted into the reference. This operator is equivalent to SAM's 44*d5c09012SAndroid Build Coastguard Worker // `I`. 45*d5c09012SAndroid Build Coastguard Worker INSERT = 2; 46*d5c09012SAndroid Build Coastguard Worker 47*d5c09012SAndroid Build Coastguard Worker // The delete operator indicates that the read contains evidence of bases 48*d5c09012SAndroid Build Coastguard Worker // being deleted from the reference. This operator is equivalent to SAM's 49*d5c09012SAndroid Build Coastguard Worker // `D`. 50*d5c09012SAndroid Build Coastguard Worker DELETE = 3; 51*d5c09012SAndroid Build Coastguard Worker 52*d5c09012SAndroid Build Coastguard Worker // The skip operator indicates that this read skips a long segment of the 53*d5c09012SAndroid Build Coastguard Worker // reference, but the bases have not been deleted. This operator is commonly 54*d5c09012SAndroid Build Coastguard Worker // used when working with RNA-seq data, where reads may skip long segments 55*d5c09012SAndroid Build Coastguard Worker // of the reference between exons. This operator is equivalent to SAM's 56*d5c09012SAndroid Build Coastguard Worker // `N`. 57*d5c09012SAndroid Build Coastguard Worker SKIP = 4; 58*d5c09012SAndroid Build Coastguard Worker 59*d5c09012SAndroid Build Coastguard Worker // The soft clip operator indicates that bases at the start/end of a read 60*d5c09012SAndroid Build Coastguard Worker // have not been considered during alignment. This may occur if the majority 61*d5c09012SAndroid Build Coastguard Worker // of a read maps, except for low quality bases at the start/end of a read. 62*d5c09012SAndroid Build Coastguard Worker // This operator is equivalent to SAM's `S`. Bases that are soft 63*d5c09012SAndroid Build Coastguard Worker // clipped will still be stored in the read. 64*d5c09012SAndroid Build Coastguard Worker CLIP_SOFT = 5; 65*d5c09012SAndroid Build Coastguard Worker 66*d5c09012SAndroid Build Coastguard Worker // The hard clip operator indicates that bases at the start/end of a read 67*d5c09012SAndroid Build Coastguard Worker // have been omitted from this alignment. This may occur if this linear 68*d5c09012SAndroid Build Coastguard Worker // alignment is part of a chimeric alignment, or if the read has been 69*d5c09012SAndroid Build Coastguard Worker // trimmed (for example, during error correction or to trim poly-A tails for 70*d5c09012SAndroid Build Coastguard Worker // RNA-seq). This operator is equivalent to SAM's `H`. 71*d5c09012SAndroid Build Coastguard Worker CLIP_HARD = 6; 72*d5c09012SAndroid Build Coastguard Worker 73*d5c09012SAndroid Build Coastguard Worker // The pad operator indicates that there is padding in an alignment. This 74*d5c09012SAndroid Build Coastguard Worker // operator is equivalent to SAM's `P`. 75*d5c09012SAndroid Build Coastguard Worker PAD = 7; 76*d5c09012SAndroid Build Coastguard Worker 77*d5c09012SAndroid Build Coastguard Worker // This operator indicates that this portion of the aligned sequence exactly 78*d5c09012SAndroid Build Coastguard Worker // matches the reference. This operator is equivalent to SAM's `=`. 79*d5c09012SAndroid Build Coastguard Worker SEQUENCE_MATCH = 8; 80*d5c09012SAndroid Build Coastguard Worker 81*d5c09012SAndroid Build Coastguard Worker // This operator indicates that this portion of the aligned sequence is an 82*d5c09012SAndroid Build Coastguard Worker // alignment match to the reference, but a sequence mismatch. This can 83*d5c09012SAndroid Build Coastguard Worker // indicate a SNP or a read error. This operator is equivalent to SAM's 84*d5c09012SAndroid Build Coastguard Worker // `X`. 85*d5c09012SAndroid Build Coastguard Worker SEQUENCE_MISMATCH = 9; 86*d5c09012SAndroid Build Coastguard Worker } 87*d5c09012SAndroid Build Coastguard Worker 88*d5c09012SAndroid Build Coastguard Worker Operation operation = 1; 89*d5c09012SAndroid Build Coastguard Worker 90*d5c09012SAndroid Build Coastguard Worker // The number of genomic bases that the operation runs for. Required. 91*d5c09012SAndroid Build Coastguard Worker int64 operation_length = 2; 92*d5c09012SAndroid Build Coastguard Worker 93*d5c09012SAndroid Build Coastguard Worker // `referenceSequence` is only used at mismatches 94*d5c09012SAndroid Build Coastguard Worker // (`SEQUENCE_MISMATCH`) and deletions (`DELETE`). 95*d5c09012SAndroid Build Coastguard Worker // Filling this field replaces SAM's MD tag. If the relevant information is 96*d5c09012SAndroid Build Coastguard Worker // not available, this field is unset. 97*d5c09012SAndroid Build Coastguard Worker string reference_sequence = 3; 98*d5c09012SAndroid Build Coastguard Worker} 99