Class: Merger
- Inherits: Object
  - Object
    - Merger
- Defined in:
- lib/nugen_barcode_splitter/merger.rb
Instance Attribute Summary
-
#sample_ids ⇒ Object
Returns the value of attribute sample_ids.
Instance Method Summary
-
#initialize(fwd, rev, outdir, number, barcodes) ⇒ Merger
constructor
A new instance of Merger.
- #make_stats(statistics) ⇒ Object
- #merge ⇒ Object
Constructor Details
#initialize(fwd, rev, outdir, number, barcodes) ⇒ Merger
Returns a new instance of Merger.
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
# File 'lib/nugen_barcode_splitter/merger.rb', line 4
#
# Builds a merger and collects the sample ids from the barcode file.
#
# Every line of +barcodes+ that contains a "#" anywhere is skipped; for each
# remaining non-blank line the first whitespace-separated token is taken as a
# sample id, in file order.
#
# @param fwd [String] stored in @fwd (opened by #merge as a gzip file)
# @param rev [String] stored in @rev (opened by #merge as a gzip file)
# @param outdir [String] stored in @outdir (directory prefix for split/output files)
# @param number [Object] stored in @number (interpolated into file names by #merge)
# @param barcodes [String] path of the barcode file to read sample ids from
# @raise [SystemCallError] if +barcodes+ cannot be opened
def initialize(fwd, rev, outdir, number, barcodes)
  # get sampleID
  @sample_ids = []
  # File.foreach closes the file once iteration finishes.
  File.foreach(barcodes) do |line|
    next if line.include?("#")

    sample_id = line.split(" ").first
    # A blank line has no first token; storing nil would break later string building.
    @sample_ids << sample_id if sample_id
  end
  @fwd = fwd
  @rev = rev
  @outdir = outdir
  @number = number
end
Instance Attribute Details
#sample_ids ⇒ Object
Returns the value of attribute sample_ids.
20 21 22 |
# File 'lib/nugen_barcode_splitter/merger.rb', line 20
#
# Reader for the sample ids held in @sample_ids.
#
# @return [Object] the current value of @sample_ids
def sample_ids
  @sample_ids
end
Instance Method Details
#make_stats(statistics) ⇒ Object
83 84 85 86 87 88 89 90 |
# File 'lib/nugen_barcode_splitter/merger.rb', line 83
#
# Renders the counters as a tab-separated text report.
#
# One "<sample id>\t<count>\n" line is produced per entry of @sample_ids
# (count taken from the same index of +statistics+), followed by an
# "unmatched" line built from the second-to-last counter and a "total" line
# built from the last counter.
#
# @param statistics [Array] counters indexed like @sample_ids, plus two trailing entries
# @return [String] the assembled report
def make_stats(statistics)
  sample_rows = @sample_ids.each_with_index.map do |sample_id, index|
    sample_id + "\t" + statistics[index].to_s + "\n"
  end
  unmatched_row = "unmatched\t" + statistics[-2].to_s + "\n"
  total_row = "total\t" + statistics[-1].to_s + "\n"
  (sample_rows << unmatched_row << total_row).join
end
#merge ⇒ Object
22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 |
# File 'lib/nugen_barcode_splitter/merger.rb', line 22
#
# Reads the gzipped files @fwd and @rev in lock-step, four lines per record,
# and distributes every record into per-sample or "unmatched" output files
# below @outdir.
#
# For each sample id the existing split file
# "<outdir>/R1_<number>.<sample_id>.fq" is read alongside. A record is
# assigned to the first sample whose next unread split-file header has the
# same first whitespace-separated token as the forward header. For such a
# record:
# * the forward header and the whole reverse record are copied unchanged;
# * the three remaining forward lines are taken from the split file, with the
#   first four leading A-Z characters of the first line replaced by "NNNN"
#   and the first four leading non-space characters of the third line
#   replaced by "@@@@".
# Records matching no sample are copied unchanged to the
# "*.unmatched.updated.fq" files.
#
# Counters: one per sample id, then unmatched (second to last) and total
# (last).
#
# @return [Object] the result of #make_stats for the collected counters
# @raise [EOFError] if @rev, @fwd or a split file ends in the middle of a record
def merge
  opened = []
  # Remember every handle so the ensure clause can close (and flush) it.
  track = lambda do |io|
    opened << io
    io
  end

  statistics = Array.new(@sample_ids.length + 2, 0)
  fwd_file = track.call(Zlib::GzipReader.open(@fwd))
  rev_file = track.call(Zlib::GzipReader.open(@rev))
  fwd_out_unmatched = track.call(File.open("#{@outdir}/R1_#{@number}.unmatched.updated.fq", 'w'))
  rev_out_unmatched = track.call(File.open("#{@outdir}/R2_#{@number}.unmatched.updated.fq", 'w'))

  fwd_splitted_files = []
  fwd_out_files = []
  rev_out_files = []
  @sample_ids.each do |sample_id|
    fwd_splitted_files << track.call(File.open("#{@outdir}/R1_#{@number}.#{sample_id}.fq"))
    fwd_out_files << track.call(File.open("#{@outdir}/R1_#{@number}.#{sample_id}.updated.fq", 'w'))
    rev_out_files << track.call(File.open("#{@outdir}/R2_#{@number}.#{sample_id}.updated.fq", 'w'))
  end

  # The block consumes the other three lines of each record itself, so this
  # loop only ever yields header lines.
  fwd_file.each do |fwd_line|
    statistics[-1] += 1
    rev_line = rev_file.readline
    fwd_name = fwd_line.split(" ").first
    matched = false

    @sample_ids.each_index do |i|
      split_file = fwd_splitted_files[i]
      next if split_file.eof?

      # Peek at the next header of this sample's split file; restore the
      # saved byte position when it does not belong to the current record.
      rewind_pos = split_file.pos
      candidate = split_file.readline
      unless candidate.split(" ").first == fwd_name
        split_file.pos = rewind_pos
        next
      end

      matched = true
      statistics[i] += 1
      fwd_out_files[i].write(fwd_line)
      rev_out_files[i].write(rev_line)
      (1..3).each do |k|
        fwd_file.readline # skipped: the split file's copy of this line is written instead
        split_line = split_file.readline
        case k
        when 1 then split_line = split_line.sub(/^[A-Z]{4}/, "NNNN")
        when 3 then split_line = split_line.sub(/^[\S]{4}/, "@@@@")
        end
        fwd_out_files[i].write(split_line)
        rev_out_files[i].write(rev_file.readline)
      end
      break
    end

    next if matched

    statistics[-2] += 1
    fwd_out_unmatched.write(fwd_line)
    rev_out_unmatched.write(rev_line)
    3.times do
      rev_out_unmatched.write(rev_file.readline)
      fwd_out_unmatched.write(fwd_file.readline)
    end
  end

  make_stats(statistics)
ensure
  opened.each { |io| io.close unless io.closed? }
end