1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
# -*- encoding: binary -*-
module Unicorn
# Acts like tee(1) on an input stream to provide an input-like stream
# while providing rewindable semantics through a File/StringIO backing
# store. On the first pass, the input is only read on demand so your
# Rack application can use input notification (upload progress and
# the like). This should fully conform to the Rack::Lint::InputWrapper
# specification on the public API. This class is intended to be a
# strict interpretation of Rack::Lint::InputWrapper functionality and
# will not support any deviations from it.
#
# When processing uploads, Unicorn exposes a TeeInput object under
# "rack.input" of the Rack environment.
class TeeInput < Struct.new(:socket, :req, :parser, :buf, :len, :tmp, :buf2)
  # Initializes a new TeeInput object.  You normally do not have to call
  # this unless you are writing an HTTP server.
  #
  # +args+ fill the Struct members in order (+socket+, +req+, +parser+,
  # +buf+, ...).  +len+, +tmp+ and +buf2+ are always overwritten here.
  # Any bytes already sitting in +buf+ are run through the parser and
  # stored in the backing store before the first read.
  def initialize(*args)
    super(*args)
    self.len = parser.content_length
    # String.new yields a mutable, binary-encoded buffer regardless of
    # any file-level magic comments.
    small_body = len && len < Const::MAX_BODY
    self.tmp = small_body ? StringIO.new(String.new) : Util.tmpio
    self.buf2 = String.new
    if buf.size > 0
      # a non-nil return from filter_body means the body is complete
      finalize_input if parser.filter_body(buf2, buf)
      tmp.write(buf2)
      tmp.seek(0)
    end
  end

  # :call-seq:
  #   ios.size  => Integer
  #
  # Returns the size of the input.  For requests with a Content-Length
  # header value, this will not read data off the socket and just return
  # the value of the Content-Length header as an Integer.
  #
  # For Transfer-Encoding:chunked requests, this requires consuming
  # all of the input stream before returning since there's no other
  # way to determine the size of the request body beforehand.
  # The current read position of the backing store is preserved.
  #
  # This method is no longer part of the Rack specification as of
  # Rack 1.2, so its use is not recommended.  This method only exists
  # for compatibility with Rack applications designed for Rack 1.1 and
  # earlier.  Most applications should only need to call +read+ with a
  # specified +length+ in a loop until it returns +nil+.
  def size
    return len if len

    if socket
      pos = tmp.pos
      nil while tee(Const::CHUNK_SIZE, buf2) # drain the socket into tmp
      tmp.seek(pos)
    end
    self.len = tmp.size
  end

  # :call-seq:
  #   ios.read([length [, buffer ]]) => string, buffer, or nil
  #
  # Reads at most length bytes from the I/O stream, or to the end of
  # file if length is omitted or is nil.  length must be a non-negative
  # integer or nil (ArgumentError is raised for a negative length).
  # If the optional buffer argument is present, it must reference a
  # String, which will receive the data.
  #
  # At end of file, it returns nil or "" depending on length.
  # ios.read() and ios.read(nil) return "".
  # ios.read(length [, buffer]) returns nil.
  #
  # If the Content-Length of the HTTP request is known (as is the common
  # case for POST requests), then ios.read(length [, buffer]) will block
  # until the specified length is read (or it is the last chunk).
  # Otherwise, for uncommon "Transfer-Encoding: chunked" requests,
  # ios.read(length [, buffer]) will return immediately if there is
  # any data and only block when nothing is available (providing
  # IO#readpartial semantics).
  def read(*args)
    # once the socket is gone everything lives in the backing store
    return tmp.read(*args) unless socket

    length, rv = args
    rv ||= String.new

    if length.nil?
      # honor the caller-supplied buffer here too, exactly like the
      # socket-less path (tmp.read(nil, buffer)) does
      tmp.read(nil, rv)
      while tee(Const::CHUNK_SIZE, buf2)
        rv << buf2
      end
      rv
    else
      # fail consistently instead of depending on which branch below
      # happens to see the bad length first
      length < 0 and raise ArgumentError, "negative length #{length} given"

      diff = tmp.size - tmp.pos # bytes buffered but not yet consumed
      if diff == 0
        ensure_length(tee(length, rv), length)
      else
        ensure_length(tmp.read(diff > length ? length : diff, rv), length)
      end
    end
  end

  # :call-seq:
  #   ios.gets   => string or nil
  #
  # Reads the next ``line'' from the I/O stream; lines are separated
  # by the global record separator ($/, typically "\n"). A global
  # record separator of nil reads the entire unread contents of ios.
  # Returns nil if called at the end of file.
  # This takes zero arguments for strict Rack::Lint compatibility,
  # unlike IO#gets.
  def gets
    return tmp.gets unless socket

    sep = $/
    if sep.nil?
      # slurp mode: read returns "" at EOF, but gets must return nil
      rest = read
      return rest.empty? ? nil : rest
    end
    sep_size = sep.bytesize

    # tee may legitimately hand back an empty chunk (it returns +dst+
    # whenever filter_body returns nil), so keep pulling until the
    # backing store yields something or the input is exhausted.
    line = nil
    until line
      pos = tmp.pos
      if pos == tmp.size
        tee(Const::CHUNK_SIZE, buf2) or return nil
        tmp.seek(pos)
      end
      line = tmp.gets
    end

    # tmp is at EOF whenever the line is still unterminated here; pull
    # more data off the socket until the separator shows up or input ends
    until sep == line[-sep_size, sep_size]
      pos = tmp.pos
      tee(Const::CHUNK_SIZE, buf2) or break
      tmp.seek(pos)
      more = tmp.gets and line << more
    end
    line
  end

  # :call-seq:
  #   ios.each { |line| block }  => ios
  #
  # Executes the block for every ``line'' in *ios*, where lines are
  # separated by the global record separator ($/, typically "\n").
  def each(&block)
    while line = gets
      yield line
    end

    self # Rack does not specify what the return value is here
  end

  # :call-seq:
  #   ios.rewind    => 0
  #
  # Positions the *ios* pointer to the beginning of input, returns
  # the offset (zero) of the +ios+ pointer.  Subsequent reads will
  # start from the beginning of the previously-buffered input.
  def rewind
    tmp.rewind # Rack does not specify what the return value is here
  end

  private

  # Translates an exception raised while reading the body; this method
  # always raises.  EOFError closes the socket and becomes ClientShutdown
  # (with an empty backtrace); HttpParserError is re-raised with its
  # backtrace cleared; anything else is re-raised untouched.
  def client_error(e)
    case e
    when EOFError
      # in case client only did a premature shutdown(SHUT_WR)
      # we do support clients that shutdown(SHUT_WR) after the
      # _entire_ request has been sent, and those will not have
      # raised EOFError on us.
      socket.close if socket
      raise ClientShutdown, "bytes_read=#{tmp.size}", []
    when HttpParserError
      e.set_backtrace([])
    end
    raise e
  end

  # tees off a +length+ chunk of data from the input into the IO
  # backing store as well as returning it.  +dst+ must be specified.
  # Returns +dst+ (possibly empty) while the parser reports more body
  # to come; returns nil once the body is complete, after which
  # +socket+ has been cleared by finalize_input.
  def tee(length, dst)
    unless parser.body_eof?
      if parser.filter_body(dst, socket.readpartial(length, buf)).nil?
        tmp.write(dst)
        tmp.seek(0, IO::SEEK_END) # workaround FreeBSD/OSX + MRI 1.8.x bug
        return dst
      end
    end
    finalize_input
    nil
  rescue => e
    client_error(e)
  end

  # Keeps reading off the socket until the parser has consumed the
  # trailers, then drops the socket so later reads are served from the
  # backing store only.
  def finalize_input
    while parser.trailers(req, buf).nil?
      # Don't worry about raising ClientShutdown here on EOFError, tee()
      # will catch EOFError when app is processing it, otherwise in
      # initialize we never get any chance to enter the app so the
      # EOFError will just get trapped by Unicorn and not the Rack app
      buf << socket.readpartial(Const::CHUNK_SIZE)
    end
    self.socket = nil
  end

  # tee()s into +dst+ until it is of +length+ bytes (or until
  # we've reached the Content-Length of the request body).
  # Returns +dst+ (the exact object, not a duplicate)
  # To continue supporting applications that need near-real-time
  # streaming input bodies, this is a no-op for
  # "Transfer-Encoding: chunked" requests.
  def ensure_length(dst, length)
    # len is nil for chunked bodies, so we can't ensure length for those
    # since they could be streaming bidirectionally and we don't want to
    # block the caller in that case.
    return dst if dst.nil? || len.nil?

    while dst.size < length && tee(length - dst.size, buf2)
      dst << buf2
    end

    dst
  end
end
end
|