|
|
|
@ -0,0 +1,254 @@
|
|
|
|
|
/**
|
|
|
|
|
* Defines data structures and parsing methods for dealing with multipart
|
|
|
|
|
* encoded request bodies.
|
|
|
|
|
*/
|
|
|
|
|
module handy_http_data.multipart;
|
|
|
|
|
|
|
|
|
|
import handy_http_primitives.request;
|
|
|
|
|
import handy_http_primitives.response;
|
|
|
|
|
import handy_http_primitives.optional;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* A single element that's part of a multipart/form-data body.
|
|
|
|
|
*/
|
|
|
|
|
struct MultipartElement {
|
|
|
|
|
/**
|
|
|
|
|
* The name of this element, as declared by this part's Content-Disposition
|
|
|
|
|
* header `name` property. There is no guarantee that this name is unique
|
|
|
|
|
* among all elements.
|
|
|
|
|
*/
|
|
|
|
|
string name;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The filename of this element, as declared by this part's
|
|
|
|
|
* Content-Disposition header `filename` property. Note that this may be
|
|
|
|
|
* null if no filename exists.
|
|
|
|
|
*/
|
|
|
|
|
Optional!string filename = Optional!string.empty;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The headers that were present with this element.
|
|
|
|
|
*/
|
|
|
|
|
string[string] headers;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The body content of this element.
|
|
|
|
|
*/
|
|
|
|
|
string content;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* A multipart/form-data body containing multiple elements, and some helper
|
|
|
|
|
* methods for those elements.
|
|
|
|
|
*/
|
|
|
|
|
struct MultipartFormData {
|
|
|
|
|
MultipartElement[] elements;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Determines if this form-data has an element with the given name. This
|
|
|
|
|
* is case-sensitive. Note that there may be more than one element with a
|
|
|
|
|
* given name.
|
|
|
|
|
* Params:
|
|
|
|
|
* elementName = The name of the element to search for.
|
|
|
|
|
* Returns: True if this form-data has such an element.
|
|
|
|
|
*/
|
|
|
|
|
bool has(string elementName) const {
|
|
|
|
|
foreach (element; elements) {
|
|
|
|
|
if (element.name == elementName) return true;
|
|
|
|
|
}
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* An exception that's thrown if parsing multipart/form-data fails due to
|
|
|
|
|
* invalid formatting or unexpected characters. This is a sub-class of the
|
|
|
|
|
* `HttpStatusException`, with each multipart exception being a BAD_REQUEST.
|
|
|
|
|
*/
|
|
|
|
|
class MultipartFormatException : HttpStatusException {
|
|
|
|
|
public this(string message) {
|
|
|
|
|
super(HttpStatus.BAD_REQUEST, message);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* The maximum number of parts to read in a multipart/form-data body. This is
|
|
|
|
|
* declared as a safety measure to avoid infinite reading of malicious or
|
|
|
|
|
* corrupted payloads.
|
|
|
|
|
*/
|
|
|
|
|
const MAX_ELEMENTS = 1024;
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Reads a request's body as multipart/form-data encoded elements.
|
|
|
|
|
* Params:
|
|
|
|
|
* request = The request to read from.
|
|
|
|
|
* allowInfiniteRead = Whether to read until no more data is available.
|
|
|
|
|
* Returns: The multipart/form-data that was read.
|
|
|
|
|
*/
|
|
|
|
|
MultipartFormData readBodyAsMultipartFormData(ref ServerHttpRequest request, bool allowInfiniteRead = false) {
|
|
|
|
|
import std.algorithm : startsWith;
|
|
|
|
|
string contentType = request.getHeaderAs!string("Content-Type");
|
|
|
|
|
if (!contentType.startsWith("multipart/form-data")) {
|
|
|
|
|
throw new MultipartFormatException("Content-Type is not multipart/form-data.");
|
|
|
|
|
}
|
|
|
|
|
size_t boundaryIdx = indexOf(contentType, "boundary=")
|
|
|
|
|
.orElseThrow(() => new MultipartFormatException("Missing multipart boundary definition."));
|
|
|
|
|
string boundary = contentType[boundaryIdx + "boundary=".length .. $];
|
|
|
|
|
string content = request.readBodyAsString(allowInfiniteRead);
|
|
|
|
|
return parseMultipartFormData(content, boundary);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* A simple linear parser for multipart/form-data encoded content. Reads a
|
|
|
|
|
* series of elements separated by a given boundary. An exception is thrown
|
|
|
|
|
* if the given content doesn't conform to standard multipart format.
|
|
|
|
|
*
|
|
|
|
|
* The main purpose of this function is to parse the multipart boundaries and
|
|
|
|
|
* hand-off parsing of each element to `readElement`.
|
|
|
|
|
* Params:
|
|
|
|
|
* content = The content to parse.
|
|
|
|
|
* boundary = The boundary between parts. This is usually present in an HTTP
|
|
|
|
|
* request's Content-Type header.
|
|
|
|
|
* Returns: The multipart/form-data content that's been parsed.
|
|
|
|
|
*/
|
|
|
|
|
MultipartFormData parseMultipartFormData(string content, string boundary) {
|
|
|
|
|
import std.array : RefAppender, appender;
|
|
|
|
|
const string boundaryNormal = "--" ~ boundary ~ "\r\n";
|
|
|
|
|
const string boundaryEnd = "--" ~ boundary ~ "--";
|
|
|
|
|
size_t nextIdx = 0; // The index in `content` to start reading from each iteration.
|
|
|
|
|
ushort elementCount = 0; // The number of elements we've read so far.
|
|
|
|
|
MultipartFormData data; // The multipart data that's been accumulated.
|
|
|
|
|
RefAppender!(MultipartElement[]) partAppender = appender(&data.elements);
|
|
|
|
|
while (elementCount < MAX_ELEMENTS) {
|
|
|
|
|
// Check that we have enough data to read a boundary marker.
|
|
|
|
|
if (content.length < nextIdx + boundary.length + 4) {
|
|
|
|
|
throw new MultipartFormatException(
|
|
|
|
|
"Unable to read next boundary marker: " ~
|
|
|
|
|
content[nextIdx .. $] ~
|
|
|
|
|
". Expected " ~ boundary
|
|
|
|
|
);
|
|
|
|
|
}
|
|
|
|
|
string nextBoundary = content[nextIdx .. nextIdx + boundary.length + 4];
|
|
|
|
|
if (nextBoundary == boundaryEnd) {
|
|
|
|
|
break; // We just read an ending boundary marker, so we're done here.
|
|
|
|
|
} else if (nextBoundary == boundaryNormal) {
|
|
|
|
|
// Find the end index of this element.
|
|
|
|
|
const size_t elementStartIdx = nextIdx + boundary.length + 4;
|
|
|
|
|
const size_t elementEndIdx = indexOf(content, "--" ~ boundary, elementStartIdx)
|
|
|
|
|
.orElseThrow(() => new MultipartFormatException(
|
|
|
|
|
"Could not find ending boundary marker for multipart element."
|
|
|
|
|
));
|
|
|
|
|
partAppender ~= readElement(content[elementStartIdx .. elementEndIdx]);
|
|
|
|
|
nextIdx = elementEndIdx;
|
|
|
|
|
elementCount++;
|
|
|
|
|
} else {
|
|
|
|
|
throw new MultipartFormatException("Invalid boundary: " ~ nextBoundary);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return data;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Reads a single multipart element. An exception is thrown if the given
|
|
|
|
|
* content doesn't represent a valid multipart/form-data element.
|
|
|
|
|
* Params:
|
|
|
|
|
* content = The raw content of the element, including headers and body.
|
|
|
|
|
* Returns: The element that was read.
|
|
|
|
|
*/
|
|
|
|
|
private MultipartElement readElement(string content) {
|
|
|
|
|
MultipartElement element;
|
|
|
|
|
size_t bodyIdx = parseElementHeaders(element, content);
|
|
|
|
|
parseContentDisposition(element);
|
|
|
|
|
element.content = content[bodyIdx .. $ - 2]; // Ignore the trailing \r\n at the end of the body.
|
|
|
|
|
return element;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Parses the headers for a multipart element.
|
|
|
|
|
* Params:
|
|
|
|
|
* element = A reference to the element that's being parsed.
|
|
|
|
|
* content = The content to parse.
|
|
|
|
|
* Returns: The index at which the header ends, and the body starts.
|
|
|
|
|
*/
|
|
|
|
|
private size_t parseElementHeaders(ref MultipartElement element, string content) {
|
|
|
|
|
import std.string : strip;
|
|
|
|
|
size_t nextHeaderIdx = 0;
|
|
|
|
|
size_t bodyIdx = content.length;
|
|
|
|
|
bool parsingHeaders = true;
|
|
|
|
|
while (parsingHeaders) {
|
|
|
|
|
string headerContent;
|
|
|
|
|
Optional!size_t headerEndIdx = indexOf(content, "\r\n", nextHeaderIdx);
|
|
|
|
|
if (!headerEndIdx) {
|
|
|
|
|
// We couldn't find the end of the next header line, so assume that there's no body and this is the last header.
|
|
|
|
|
headerContent = content[nextHeaderIdx .. $];
|
|
|
|
|
parsingHeaders = false;
|
|
|
|
|
} else {
|
|
|
|
|
// We found the end of the next header line.
|
|
|
|
|
headerContent = content[nextHeaderIdx .. headerEndIdx.value];
|
|
|
|
|
nextHeaderIdx = headerEndIdx.value + 2;
|
|
|
|
|
// Check to see if this is the last header (expect one more \r\n after the normal ending).
|
|
|
|
|
if (content.length >= nextHeaderIdx + 2 && content[nextHeaderIdx .. nextHeaderIdx + 2] == "\r\n") {
|
|
|
|
|
bodyIdx = nextHeaderIdx + 2;
|
|
|
|
|
parsingHeaders = false;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
size_t headerValueSeparatorIdx = indexOf(headerContent, ":")
|
|
|
|
|
.orElseThrow(() => new MultipartFormatException("Invalid header line: " ~ headerContent));
|
|
|
|
|
// const ulong headerValueSeparatorIdx = countUntil(headerContent, ":");
|
|
|
|
|
string headerName = strip(headerContent[0 .. headerValueSeparatorIdx]);
|
|
|
|
|
string headerValue = strip(headerContent[headerValueSeparatorIdx + 1 .. $]);
|
|
|
|
|
element.headers[headerName] = headerValue;
|
|
|
|
|
}
|
|
|
|
|
return bodyIdx;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Parses and populates multipart element metadata according to information
|
|
|
|
|
* found in the element's Content-Disposition header.
|
|
|
|
|
* Params:
|
|
|
|
|
* element = A reference to the element that's being parsed.
|
|
|
|
|
*/
|
|
|
|
|
private void parseContentDisposition(ref MultipartElement element) {
|
|
|
|
|
import std.algorithm : startsWith, endsWith;
|
|
|
|
|
import std.string : split, strip;
|
|
|
|
|
import std.uri : decodeComponent;
|
|
|
|
|
if ("Content-Disposition" !in element.headers) {
|
|
|
|
|
throw new MultipartFormatException("Missing required Content-Disposition header for multipart element.");
|
|
|
|
|
}
|
|
|
|
|
string contentDisposition = element.headers["Content-Disposition"];
|
|
|
|
|
string[] cdParts = split(contentDisposition, ";");
|
|
|
|
|
foreach (string part; cdParts) {
|
|
|
|
|
string stripped = strip(part);
|
|
|
|
|
if (startsWith(stripped, "name=\"") && endsWith(stripped, "\"")) {
|
|
|
|
|
element.name = decodeComponent(stripped[6 .. $ - 1]);
|
|
|
|
|
} else if (startsWith(stripped, "filename=\"") && endsWith(stripped, "\"")) {
|
|
|
|
|
import std.typecons : nullable;
|
|
|
|
|
element.filename = Optional!string.of(decodeComponent(stripped[10 .. $ - 1]));
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
private Optional!size_t indexOf(T)(T[] array, T[] subset, size_t offset = 0) {
|
|
|
|
|
if (subset.length > array.length) return Optional!size_t.empty;
|
|
|
|
|
if (subset.length == array.length) {
|
|
|
|
|
if (offset != 0) return Optional!size_t.empty;
|
|
|
|
|
return subset == array ? Optional!size_t.of(0) : Optional!size_t.empty;
|
|
|
|
|
}
|
|
|
|
|
if (subset.length == 0) return Optional!size_t.of(0);
|
|
|
|
|
size_t index = offset;
|
|
|
|
|
while (index < (array.length - subset.length)) {
|
|
|
|
|
if (array[index .. index + subset.length] == subset) return Optional!size_t.of(index);
|
|
|
|
|
index++;
|
|
|
|
|
}
|
|
|
|
|
return Optional!size_t.empty;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
unittest {
|
|
|
|
|
assert(indexOf("abc", "a").value == 0);
|
|
|
|
|
assert(indexOf("abc", "a", 1).isNull);
|
|
|
|
|
assert(indexOf("hello world!", "world").value == 6);
|
|
|
|
|
assert(indexOf("hello world!", "world", 7).isNull);
|
|
|
|
|
assert(indexOf("hello world!", "world", 3).value == 6);
|
|
|
|
|
assert(indexOf("", "bleh").isNull);
|
|
|
|
|
assert(indexOf("", "blerg", 42).isNull);
|
|
|
|
|
}
|