Class: CSV::Parser::InputsScanner
- Inherits:
-
Object
- Object
- CSV::Parser::InputsScanner
- Defined in:
- lib/csv/parser.rb
Overview
CSV::Parser::InputsScanner receives IO inputs, an encoding and a chunk_size. It also lets the caller mark a span of scanned data and later extract it, rewind to its start, or discard the mark, through its methods keep_start, keep_end, keep_back and keep_drop.
CSV::Parser::InputsScanner#scan tries to match the given pattern at the current position. If there’s a match, the scanner advances the “scan pointer” and returns the matched string. Otherwise, the scanner returns nil.
CSV::Parser::InputsScanner#rest returns the “rest” of the string (i.e. everything after the scan pointer). If there is no more data (eos? returns true), it returns “”.
Instance Method Summary
- #each_line(row_separator) {|buffer| ... } ⇒ Object
- #eos? ⇒ Boolean
-
#initialize(inputs, encoding, chunk_size: 8192) ⇒ InputsScanner
constructor
A new instance of InputsScanner.
- #keep_back ⇒ Object
- #keep_drop ⇒ Object
- #keep_end ⇒ Object
- #keep_start ⇒ Object
- #rest ⇒ Object
- #scan(pattern) ⇒ Object
- #scan_all(pattern) ⇒ Object
Constructor Details
#initialize(inputs, encoding, chunk_size: 8192) ⇒ InputsScanner
Returns a new instance of InputsScanner.
88 89 90 91 92 93 94 95 |
# File 'lib/csv/parser.rb', line 88
#
# Stores the scanner configuration and immediately loads the first chunk
# through read_chunk.
#
# @param inputs [Array] queue of input sources. It is shallow-copied, so
#   later changes this object makes to its own queue (keep_back pushes
#   entries onto the front) do not touch the caller's collection.
#   NOTE(review): elements are presumably IO-like objects - confirm
#   against read_chunk, which is not visible in this listing.
# @param encoding [Object] stored as-is in @encoding; not used by the
#   methods in this listing.
# @param chunk_size [Integer] stored as-is in @chunk_size (default 8192);
#   presumably the read size used by read_chunk - confirm there.
def initialize(inputs, encoding, chunk_size: 8192)
  @encoding = encoding
  @chunk_size = chunk_size
  # Stack of [start_position, buffer] pairs managed by the keep_* methods.
  @keeps = []
  @inputs = inputs.dup
  # With no inputs queued, whatever scanner is current is also the last one.
  @last_scanner = @inputs.empty?
  read_chunk
end
Instance Method Details
#each_line(row_separator) {|buffer| ... } ⇒ Object
97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 |
# File 'lib/csv/parser.rb', line 97
#
# Yields the remaining input one line at a time, loading further chunks
# with read_chunk until it reports that nothing is left.
#
# Every yielded line ends with row_separator, except possibly the final
# one, which is whatever trailing data had no separator. Before each yield
# the scan pointer is placed just after the line being yielded.
#
# @param row_separator [String] the line terminator to split on.
# @yieldparam buffer [String] the next line, separator included.
# @return [Enumerator] when called without a block; otherwise the value of
#   the final expression (nil unless a trailing partial line was yielded).
def each_line(row_separator)
  # Without this guard a block-less call fails with LocalJumpError at the
  # first yield; returning an Enumerator is the conventional behaviour.
  return enum_for(__method__, row_separator) unless block_given?

  # Incomplete line (no trailing separator yet) carried to the next piece.
  buffer = nil
  input = @scanner.rest
  # Scanner position just after the last complete line handed out.
  position = @scanner.pos
  # Negative size of the bytes in buffer that came from a previous chunk;
  # they must not be counted against the current scanner's position.
  offset = 0
  n_row_separator_chars = row_separator.size
  # `while true` rather than `loop`: Kernel#loop rescues StopIteration, which
  # would silently swallow one raised from the caller's block.
  while true
    input.each_line(row_separator) do |line|
      @scanner.pos += line.bytesize
      if buffer
        if n_row_separator_chars == 2 &&
           buffer.end_with?(row_separator[0]) &&
           line.start_with?(row_separator[1])
          # A two-character separator was split across two pieces: move its
          # second character onto the buffered line to complete it.
          buffer << line[0]
          line = line[1..-1]
          position += buffer.bytesize + offset
          @scanner.pos = position
          offset = 0
          yield(buffer)
          buffer = nil
          next if line.empty?
        else
          # Plain continuation of the buffered partial line.
          buffer << line
          line = buffer
          buffer = nil
        end
      end
      if line.end_with?(row_separator)
        position += line.bytesize + offset
        @scanner.pos = position
        offset = 0
        yield(line)
      else
        buffer = line
      end
    end
    break unless read_chunk
    input = @scanner.rest
    position = @scanner.pos
    offset = -buffer.bytesize if buffer
  end
  # Trailing data that never received a separator.
  yield(buffer) if buffer
end
#eos? ⇒ Boolean
164 165 166 |
# File 'lib/csv/parser.rb', line 164
#
# Reports whether the current scanner has reached the end of its string.
# Only the scanner currently held in @scanner is consulted.
#
# @return [Boolean] the result of the current scanner's eos?.
def eos?
  @scanner.eos?
end
#keep_back ⇒ Object
182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 |
# File 'lib/csv/parser.rb', line 182
#
# Abandons the most recent keep and rewinds to where it started.
#
# The top [start, buffer] entry is popped from @keeps. With no buffer, the
# scan pointer simply moves back to start. With a buffer, scanning restarts
# on the buffer, and the current scanner's data from start onwards is
# queued at the front of @inputs so it is read again afterwards.
# NOTE(review): the buffer is presumably filled by read_chunk when a keep
# spans a chunk boundary - nothing in this listing sets it.
#
# @return [Object, nil] the result of read_chunk if the scanner ended up at
#   end of string, otherwise nil.
def keep_back
  start, buffer = @keeps.pop
  if buffer
    current = @scanner.string
    pending = current.byteslice(start, current.bytesize - start)
    unless pending.nil? || pending.empty?
      @inputs.unshift(StringIO.new(pending))
      # Another input is queued now, so this scanner is no longer the last.
      @last_scanner = false
    end
    @scanner = StringScanner.new(buffer)
  else
    @scanner.pos = start
  end
  read_chunk if @scanner.eos?
end
#keep_drop ⇒ Object
198 199 200 |
# File 'lib/csv/parser.rb', line 198
#
# Discards the most recent keep without moving the scan pointer.
#
# @return [Array, nil] the popped [start, buffer] entry, or nil when no
#   keep was active.
def keep_drop
  @keeps.pop
end
#keep_end ⇒ Object
172 173 174 175 176 177 178 179 180 |
# File 'lib/csv/parser.rb', line 172
#
# Finishes the most recent keep and returns the data scanned since it
# started.
#
# The top [start, buffer] entry is popped from @keeps and the bytes between
# start and the current scan pointer are sliced out of the current
# scanner's string. If the entry carries a buffer, the slice is appended to
# that buffer (mutating it) and the buffer is returned.
#
# @return [String, nil] the kept data.
def keep_end
  start, buffer = @keeps.pop
  kept = @scanner.string.byteslice(start, @scanner.pos - start)
  return kept unless buffer

  # String#<< returns its receiver, so this returns the extended buffer.
  buffer << kept
end
#keep_start ⇒ Object
168 169 170 |
# File 'lib/csv/parser.rb', line 168
#
# Starts a keep at the current scan pointer by pushing a
# [position, nil] entry onto @keeps. The nil slot is the entry's buffer.
#
# @return [Array] the @keeps stack itself.
def keep_start
  @keeps << [@scanner.pos, nil]
end
#rest ⇒ Object
202 203 204 |
# File 'lib/csv/parser.rb', line 202
#
# Returns what is left after the scan pointer in the current scanner.
# Only the scanner currently held in @scanner is consulted.
#
# @return [String] the result of the current scanner's rest.
def rest
  @scanner.rest
end
#scan(pattern) ⇒ Object
141 142 143 144 145 146 147 148 149 150 151 |
# File 'lib/csv/parser.rb', line 141
#
# Tries to match pattern at the scan pointer of the current scanner.
#
# After a successful match that consumes the rest of the current scanner,
# the next chunk is loaded through read_chunk, unless this scanner is
# already flagged as the last one.
#
# @param pattern [Regexp] pattern handed to the current scanner's scan.
# @return [String, nil] the matched text, or nil when there is no match.
def scan(pattern)
  matched = @scanner.scan(pattern)
  # Refill only when something matched, the scanner is used up, and more
  # input may still follow.
  read_chunk if !@last_scanner && matched && @scanner.eos?
  matched
end
#scan_all(pattern) ⇒ Object
153 154 155 156 157 158 159 160 161 162 |
# File 'lib/csv/parser.rb', line 153
#
# Like scan, but keeps matching across chunk boundaries.
#
# While a match runs to the end of the current scanner and read_chunk
# supplies another chunk, pattern is applied again at the start of the new
# chunk and any match is appended to the result. Nothing is read ahead when
# the current scanner is flagged as the last one or the first match fails.
#
# @param pattern [Regexp] pattern handed to the current scanner's scan.
# @return [String, nil] the concatenated matches, or nil when the first
#   attempt does not match.
def scan_all(pattern)
  matched = @scanner.scan(pattern)
  return matched if @last_scanner || matched.nil?

  while @scanner.eos? && read_chunk
    continuation = @scanner.scan(pattern)
    break unless continuation

    matched << continuation
  end
  matched
end