2010-08-12 22:55:48 +08:00
|
|
|
/***************************************************************************
|
|
|
|
* _ _ ____ _
|
|
|
|
* Project ___| | | | _ \| |
|
|
|
|
* / __| | | | |_) | |
|
|
|
|
* | (__| |_| | _ <| |___
|
|
|
|
* \___|\___/|_| \_\_____|
|
|
|
|
*
|
2023-01-02 20:51:48 +08:00
|
|
|
* Copyright (C) Daniel Stenberg, <daniel@haxx.se>, et al.
|
2010-08-12 22:55:48 +08:00
|
|
|
*
|
|
|
|
* This software is licensed as described in the file COPYING, which
|
|
|
|
* you should have received as part of this distribution. The terms
|
2020-11-04 21:02:01 +08:00
|
|
|
* are also available at https://curl.se/docs/copyright.html.
|
2010-08-12 22:55:48 +08:00
|
|
|
*
|
|
|
|
* You may opt to use, copy, modify, merge, publish, distribute and/or sell
|
|
|
|
* copies of the Software, and permit persons to whom the Software is
|
|
|
|
* furnished to do so, under the terms of the COPYING file.
|
|
|
|
*
|
|
|
|
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
|
|
|
|
* KIND, either express or implied.
|
|
|
|
*
|
2021-01-09 00:58:15 +08:00
|
|
|
* SPDX-License-Identifier: curl
|
2022-05-17 17:16:50 +08:00
|
|
|
*
|
2010-08-12 22:55:48 +08:00
|
|
|
***************************************************************************/
|
|
|
|
|
2013-01-07 02:06:49 +08:00
|
|
|
#include "curl_setup.h"
|
2010-08-12 22:55:48 +08:00
|
|
|
|
|
|
|
#ifndef CURL_DISABLE_GOPHER
|
|
|
|
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "urldata.h"
|
2010-08-12 22:55:48 +08:00
|
|
|
#include <curl/curl.h>
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "transfer.h"
|
|
|
|
#include "sendf.h"
|
2022-11-11 18:45:34 +08:00
|
|
|
#include "cfilters.h"
|
2020-04-12 20:03:38 +08:00
|
|
|
#include "connect.h"
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "progress.h"
|
|
|
|
#include "gopher.h"
|
|
|
|
#include "select.h"
|
2018-12-12 23:58:18 +08:00
|
|
|
#include "strdup.h"
|
2020-11-16 01:46:06 +08:00
|
|
|
#include "vtls/vtls.h"
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "url.h"
|
2016-10-08 17:21:38 +08:00
|
|
|
#include "escape.h"
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "warnless.h"
|
2018-12-12 23:58:18 +08:00
|
|
|
#include "curl_printf.h"
|
2012-11-17 07:59:42 +08:00
|
|
|
#include "curl_memory.h"
|
2010-08-12 22:55:48 +08:00
|
|
|
/* The last #include file should be: */
|
2013-01-04 09:50:28 +08:00
|
|
|
#include "memdebug.h"
|
2010-08-12 22:55:48 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Forward declarations.
|
|
|
|
*/
|
|
|
|
|
2021-01-09 00:58:15 +08:00
|
|
|
static CURLcode gopher_do(struct Curl_easy *data, bool *done);
|
2020-11-16 01:46:06 +08:00
|
|
|
#ifdef USE_SSL
|
2021-01-09 00:58:15 +08:00
|
|
|
static CURLcode gopher_connect(struct Curl_easy *data, bool *done);
|
|
|
|
static CURLcode gopher_connecting(struct Curl_easy *data, bool *done);
|
2020-11-16 01:46:06 +08:00
|
|
|
#endif
|
2010-08-12 22:55:48 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Gopher protocol handler.
|
|
|
|
* This is also a nice simple template to build off for simple
|
|
|
|
* connect-command-download protocols.
|
|
|
|
*/
|
|
|
|
|
|
|
|
const struct Curl_handler Curl_handler_gopher = {
|
|
|
|
"GOPHER", /* scheme */
|
|
|
|
ZERO_NULL, /* setup_connection */
|
|
|
|
gopher_do, /* do_it */
|
|
|
|
ZERO_NULL, /* done */
|
|
|
|
ZERO_NULL, /* do_more */
|
|
|
|
ZERO_NULL, /* connect_it */
|
|
|
|
ZERO_NULL, /* connecting */
|
|
|
|
ZERO_NULL, /* doing */
|
|
|
|
ZERO_NULL, /* proto_getsock */
|
|
|
|
ZERO_NULL, /* doing_getsock */
|
2011-10-22 05:36:54 +08:00
|
|
|
ZERO_NULL, /* domore_getsock */
|
2010-08-12 22:55:48 +08:00
|
|
|
ZERO_NULL, /* perform_getsock */
|
|
|
|
ZERO_NULL, /* disconnect */
|
lib: replace readwrite with write_resp
This clarifies the handling of server responses by folding the code for
the complicated protocols into their protocol handlers. This concerns
mainly HTTP and its bastard sibling RTSP.
The terms "read" and "write" are often used without clear context if
they refer to the connect or the client/application side of a
transfer. This PR uses "read/write" for operations on the client side
and "send/receive" for the connection, e.g. server side. If this is
considered useful, we can revisit renaming of further methods in another
PR.
Curl's protocol handler `readwrite()` method been changed:
```diff
- CURLcode (*readwrite)(struct Curl_easy *data, struct connectdata *conn,
- const char *buf, size_t blen,
- size_t *pconsumed, bool *readmore);
+ CURLcode (*write_resp)(struct Curl_easy *data, const char *buf, size_t blen,
+ bool is_eos, bool *done);
```
The name was changed to clarify that this writes reponse data to the
client side. The parameter changes are:
* `conn` removed as it always operates on `data->conn`
* `pconsumed` removed as the method needs to handle all data on success
* `readmore` removed as no longer necessary
* `is_eos` as indicator that this is the last call for the transfer
response (end-of-stream).
* `done` TRUE on return iff the transfer response is to be treated as
finished
This change affects many files only because of updated comments in
handlers that provide no implementation. The real change is that the
HTTP protocol handlers now provide an implementation.
The HTTP protocol handlers `write_resp()` implementation will get passed
**all** raw data of a server response for the transfer. The HTTP/1.x
formatted status and headers, as well as the undecoded response
body. `Curl_http_write_resp_hds()` is used internally to parse the
response headers and pass them on. This method is public as the RTSP
protocol handler also uses it.
HTTP/1.1 "chunked" transport encoding is now part of the general
*content encoding* writer stack, just like other encodings. A new flag
`CLIENTWRITE_EOS` was added for the last client write. This allows
writers to verify that they are in a valid end state. The chunked
decoder will check if it indeed has seen the last chunk.
The general response handling in `transfer.c:466` happens in function
`readwrite_data()`. This mainly operates now like:
```
static CURLcode readwrite_data(data, ...)
{
do {
Curl_xfer_recv_resp(data, buf)
...
Curl_xfer_write_resp(data, buf)
...
} while(interested);
...
}
```
All the response data handling is implemented in
`Curl_xfer_write_resp()`. It calls the protocol handler's `write_resp()`
implementation if available, or does the default behaviour.
All raw response data needs to pass through this function. Which also
means that anyone in possession of such data may call
`Curl_xfer_write_resp()`.
Closes #12480
2023-12-01 20:50:32 +08:00
|
|
|
ZERO_NULL, /* write_resp */
|
2024-03-21 19:15:59 +08:00
|
|
|
ZERO_NULL, /* write_resp_hd */
|
2017-05-31 19:09:56 +08:00
|
|
|
ZERO_NULL, /* connection_check */
|
2021-05-17 14:54:00 +08:00
|
|
|
ZERO_NULL, /* attach connection */
|
2010-08-12 22:55:48 +08:00
|
|
|
PORT_GOPHER, /* defport */
|
2011-03-15 05:52:14 +08:00
|
|
|
CURLPROTO_GOPHER, /* protocol */
|
2020-09-21 19:45:24 +08:00
|
|
|
CURLPROTO_GOPHER, /* family */
|
2011-03-15 05:22:22 +08:00
|
|
|
PROTOPT_NONE /* flags */
|
2010-08-12 22:55:48 +08:00
|
|
|
};
|
|
|
|
|
2020-11-16 01:46:06 +08:00
|
|
|
#ifdef USE_SSL
|
|
|
|
const struct Curl_handler Curl_handler_gophers = {
|
|
|
|
"GOPHERS", /* scheme */
|
|
|
|
ZERO_NULL, /* setup_connection */
|
|
|
|
gopher_do, /* do_it */
|
|
|
|
ZERO_NULL, /* done */
|
|
|
|
ZERO_NULL, /* do_more */
|
|
|
|
gopher_connect, /* connect_it */
|
|
|
|
gopher_connecting, /* connecting */
|
|
|
|
ZERO_NULL, /* doing */
|
|
|
|
ZERO_NULL, /* proto_getsock */
|
|
|
|
ZERO_NULL, /* doing_getsock */
|
|
|
|
ZERO_NULL, /* domore_getsock */
|
|
|
|
ZERO_NULL, /* perform_getsock */
|
|
|
|
ZERO_NULL, /* disconnect */
|
lib: replace readwrite with write_resp
This clarifies the handling of server responses by folding the code for
the complicated protocols into their protocol handlers. This concerns
mainly HTTP and its bastard sibling RTSP.
The terms "read" and "write" are often used without clear context if
they refer to the connect or the client/application side of a
transfer. This PR uses "read/write" for operations on the client side
and "send/receive" for the connection, e.g. server side. If this is
considered useful, we can revisit renaming of further methods in another
PR.
Curl's protocol handler `readwrite()` method been changed:
```diff
- CURLcode (*readwrite)(struct Curl_easy *data, struct connectdata *conn,
- const char *buf, size_t blen,
- size_t *pconsumed, bool *readmore);
+ CURLcode (*write_resp)(struct Curl_easy *data, const char *buf, size_t blen,
+ bool is_eos, bool *done);
```
The name was changed to clarify that this writes reponse data to the
client side. The parameter changes are:
* `conn` removed as it always operates on `data->conn`
* `pconsumed` removed as the method needs to handle all data on success
* `readmore` removed as no longer necessary
* `is_eos` as indicator that this is the last call for the transfer
response (end-of-stream).
* `done` TRUE on return iff the transfer response is to be treated as
finished
This change affects many files only because of updated comments in
handlers that provide no implementation. The real change is that the
HTTP protocol handlers now provide an implementation.
The HTTP protocol handlers `write_resp()` implementation will get passed
**all** raw data of a server response for the transfer. The HTTP/1.x
formatted status and headers, as well as the undecoded response
body. `Curl_http_write_resp_hds()` is used internally to parse the
response headers and pass them on. This method is public as the RTSP
protocol handler also uses it.
HTTP/1.1 "chunked" transport encoding is now part of the general
*content encoding* writer stack, just like other encodings. A new flag
`CLIENTWRITE_EOS` was added for the last client write. This allows
writers to verify that they are in a valid end state. The chunked
decoder will check if it indeed has seen the last chunk.
The general response handling in `transfer.c:466` happens in function
`readwrite_data()`. This mainly operates now like:
```
static CURLcode readwrite_data(data, ...)
{
do {
Curl_xfer_recv_resp(data, buf)
...
Curl_xfer_write_resp(data, buf)
...
} while(interested);
...
}
```
All the response data handling is implemented in
`Curl_xfer_write_resp()`. It calls the protocol handler's `write_resp()`
implementation if available, or does the default behaviour.
All raw response data needs to pass through this function. Which also
means that anyone in possession of such data may call
`Curl_xfer_write_resp()`.
Closes #12480
2023-12-01 20:50:32 +08:00
|
|
|
ZERO_NULL, /* write_resp */
|
2024-03-21 19:15:59 +08:00
|
|
|
ZERO_NULL, /* write_resp_hd */
|
2020-11-16 01:46:06 +08:00
|
|
|
ZERO_NULL, /* connection_check */
|
2021-05-17 14:54:00 +08:00
|
|
|
ZERO_NULL, /* attach connection */
|
2020-11-16 01:46:06 +08:00
|
|
|
PORT_GOPHER, /* defport */
|
2021-01-06 00:22:09 +08:00
|
|
|
CURLPROTO_GOPHERS, /* protocol */
|
2020-11-16 01:46:06 +08:00
|
|
|
CURLPROTO_GOPHER, /* family */
|
|
|
|
PROTOPT_SSL /* flags */
|
|
|
|
};
|
|
|
|
|
2021-01-09 00:58:15 +08:00
|
|
|
static CURLcode gopher_connect(struct Curl_easy *data, bool *done)
|
2020-11-16 01:46:06 +08:00
|
|
|
{
|
2021-01-09 00:58:15 +08:00
|
|
|
(void)data;
|
2020-11-16 01:46:06 +08:00
|
|
|
(void)done;
|
|
|
|
return CURLE_OK;
|
|
|
|
}
|
|
|
|
|
2021-01-09 00:58:15 +08:00
|
|
|
static CURLcode gopher_connecting(struct Curl_easy *data, bool *done)
|
2020-11-16 01:46:06 +08:00
|
|
|
{
|
2021-01-09 00:58:15 +08:00
|
|
|
struct connectdata *conn = data->conn;
|
2022-11-11 18:45:34 +08:00
|
|
|
CURLcode result;
|
|
|
|
|
2022-11-22 16:55:41 +08:00
|
|
|
result = Curl_conn_connect(data, FIRSTSOCKET, TRUE, done);
|
2020-11-16 01:46:06 +08:00
|
|
|
if(result)
|
|
|
|
connclose(conn, "Failed TLS connection");
|
|
|
|
*done = TRUE;
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2021-01-09 00:58:15 +08:00
|
|
|
static CURLcode gopher_do(struct Curl_easy *data, bool *done)
|
2010-08-12 22:55:48 +08:00
|
|
|
{
|
2017-09-10 05:09:06 +08:00
|
|
|
CURLcode result = CURLE_OK;
|
2021-01-09 00:58:15 +08:00
|
|
|
struct connectdata *conn = data->conn;
|
2010-08-12 22:55:48 +08:00
|
|
|
curl_socket_t sockfd = conn->sock[FIRSTSOCKET];
|
2018-12-12 23:58:18 +08:00
|
|
|
char *gopherpath;
|
2018-09-15 05:33:28 +08:00
|
|
|
char *path = data->state.up.path;
|
2018-12-12 23:58:18 +08:00
|
|
|
char *query = data->state.up.query;
|
2017-03-04 08:17:24 +08:00
|
|
|
char *sel = NULL;
|
2010-08-25 05:14:00 +08:00
|
|
|
char *sel_org = NULL;
|
2020-04-12 20:03:38 +08:00
|
|
|
timediff_t timeout_ms;
|
lib: Curl_read/Curl_write clarifications
- replace `Curl_read()`, `Curl_write()` and `Curl_nwrite()` to
clarify when and at what level they operate
- send/recv of transfer related data is now done via
`Curl_xfer_send()/Curl_xfer_recv()` which no longer has
socket/socketindex as parameter. It decides on the transfer
setup of `conn->sockfd` and `conn->writesockfd` on which
connection filter chain to operate.
- send/recv on a specific connection filter chain is done via
`Curl_conn_send()/Curl_conn_recv()` which get the socket index
as parameter.
- rename `Curl_setup_transfer()` to `Curl_xfer_setup()` for
naming consistency
- clarify that the special CURLE_AGAIN hangling to return
`CURLE_OK` with length 0 only applies to `Curl_xfer_send()`
and CURLE_AGAIN is returned by all other send() variants.
- fix a bug in websocket `curl_ws_recv()` that mixed up data
when it arrived in more than a single chunk
The method for sending not just raw bytes, but bytes that are either
"headers" or "body". The send abstraction stack, to to bottom, now is:
* `Curl_req_send()`: has parameter to indicate amount of header bytes,
buffers all data.
* `Curl_xfer_send()`: knows on which socket index to send, returns
amount of bytes sent.
* `Curl_conn_send()`: called with socket index, returns amount of bytes
sent.
In addition there is `Curl_req_flush()` for writing out all buffered
bytes.
`Curl_req_send()` is active for requests without body,
`Curl_buffer_send()` still being used for others. This is because the
special quirks need to be addressed in future parts:
* `expect-100` handling
* `Curl_fillreadbuffer()` needs to add directly to the new
`data->req.sendbuf`
* special body handlings, like `chunked` encodings and line end
conversions will be moved into something like a Client Reader.
In functions of the pattern `CURLcode xxx_send(..., ssize_t *written)`,
replace the `ssize_t` with a `size_t`. It makes no sense to allow for negative
values as the returned `CURLcode` already specifies error conditions. This
allows easier handling of lengths without casting.
Closes #12964
2024-02-15 23:22:53 +08:00
|
|
|
ssize_t k;
|
|
|
|
size_t amount, len;
|
2020-04-12 20:03:38 +08:00
|
|
|
int what;
|
2010-08-12 22:55:48 +08:00
|
|
|
|
|
|
|
*done = TRUE; /* unconditionally */
|
|
|
|
|
2019-03-04 19:22:51 +08:00
|
|
|
/* path is guaranteed non-NULL */
|
|
|
|
DEBUGASSERT(path);
|
|
|
|
|
|
|
|
if(query)
|
2018-12-12 23:58:18 +08:00
|
|
|
gopherpath = aprintf("%s?%s", path, query);
|
|
|
|
else
|
|
|
|
gopherpath = strdup(path);
|
|
|
|
|
|
|
|
if(!gopherpath)
|
|
|
|
return CURLE_OUT_OF_MEMORY;
|
|
|
|
|
2010-08-12 22:55:48 +08:00
|
|
|
/* Create selector. Degenerate cases: / and /1 => convert to "" */
|
2018-12-12 23:58:18 +08:00
|
|
|
if(strlen(gopherpath) <= 2) {
|
2010-08-12 22:55:48 +08:00
|
|
|
sel = (char *)"";
|
2018-08-31 16:17:40 +08:00
|
|
|
len = strlen(sel);
|
2018-12-13 22:06:17 +08:00
|
|
|
free(gopherpath);
|
2015-10-01 23:17:58 +08:00
|
|
|
}
|
2010-08-12 22:55:48 +08:00
|
|
|
else {
|
|
|
|
char *newp;
|
|
|
|
|
|
|
|
/* Otherwise, drop / and the first character (i.e., item type) ... */
|
2018-12-12 23:58:18 +08:00
|
|
|
newp = gopherpath;
|
2017-09-10 05:09:06 +08:00
|
|
|
newp += 2;
|
2010-08-12 22:55:48 +08:00
|
|
|
|
|
|
|
/* ... and finally unescape */
|
2022-02-03 20:04:30 +08:00
|
|
|
result = Curl_urldecode(newp, 0, &sel, &len, REJECT_ZERO);
|
2018-12-12 23:58:18 +08:00
|
|
|
free(gopherpath);
|
2017-02-26 07:10:30 +08:00
|
|
|
if(result)
|
|
|
|
return result;
|
2010-08-25 05:14:00 +08:00
|
|
|
sel_org = sel;
|
2010-08-12 22:55:48 +08:00
|
|
|
}
|
|
|
|
|
2015-10-01 23:17:58 +08:00
|
|
|
k = curlx_uztosz(len);
|
2010-08-25 05:14:00 +08:00
|
|
|
|
2010-08-24 05:30:59 +08:00
|
|
|
for(;;) {
|
2020-11-16 01:46:06 +08:00
|
|
|
/* Break out of the loop if the selector is empty because OpenSSL and/or
|
|
|
|
LibreSSL fail with errno 0 if this is the case. */
|
|
|
|
if(strlen(sel) < 1)
|
|
|
|
break;
|
|
|
|
|
2024-02-14 19:09:32 +08:00
|
|
|
result = Curl_xfer_send(data, sel, k, &amount);
|
2014-10-24 04:56:35 +08:00
|
|
|
if(!result) { /* Which may not have written it all! */
|
2021-01-09 00:58:15 +08:00
|
|
|
result = Curl_client_write(data, CLIENTWRITE_HEADER, sel, amount);
|
2016-10-18 17:12:03 +08:00
|
|
|
if(result)
|
|
|
|
break;
|
|
|
|
|
2010-08-24 05:30:59 +08:00
|
|
|
k -= amount;
|
|
|
|
sel += amount;
|
2011-04-20 21:17:42 +08:00
|
|
|
if(k < 1)
|
2010-08-24 05:30:59 +08:00
|
|
|
break; /* but it did write it all */
|
2010-08-25 05:14:00 +08:00
|
|
|
}
|
2016-10-18 17:12:03 +08:00
|
|
|
else
|
|
|
|
break;
|
|
|
|
|
2021-01-19 05:57:56 +08:00
|
|
|
timeout_ms = Curl_timeleft(data, NULL, FALSE);
|
2020-04-12 20:03:38 +08:00
|
|
|
if(timeout_ms < 0) {
|
|
|
|
result = CURLE_OPERATION_TIMEDOUT;
|
|
|
|
break;
|
|
|
|
}
|
2020-04-15 16:27:20 +08:00
|
|
|
if(!timeout_ms)
|
|
|
|
timeout_ms = TIMEDIFF_T_MAX;
|
2020-04-12 20:03:38 +08:00
|
|
|
|
2010-08-25 05:14:00 +08:00
|
|
|
/* Don't busyloop. The entire loop thing is a work-around as it causes a
|
|
|
|
BLOCKING behavior which is a NO-NO. This function should rather be
|
|
|
|
split up in a do and a doing piece where the pieces that aren't
|
|
|
|
possible to send now will be sent in the doing function repeatedly
|
|
|
|
until the entire request is sent.
|
|
|
|
*/
|
2020-04-15 16:27:20 +08:00
|
|
|
what = SOCKET_WRITABLE(sockfd, timeout_ms);
|
2020-04-12 20:03:38 +08:00
|
|
|
if(what < 0) {
|
2016-10-18 17:12:03 +08:00
|
|
|
result = CURLE_SEND_ERROR;
|
|
|
|
break;
|
|
|
|
}
|
2020-04-12 20:03:38 +08:00
|
|
|
else if(!what) {
|
|
|
|
result = CURLE_OPERATION_TIMEDOUT;
|
|
|
|
break;
|
|
|
|
}
|
2010-08-24 05:30:59 +08:00
|
|
|
}
|
2010-08-25 05:14:00 +08:00
|
|
|
|
2015-03-16 22:01:15 +08:00
|
|
|
free(sel_org);
|
2010-08-25 05:14:00 +08:00
|
|
|
|
2016-10-18 17:12:03 +08:00
|
|
|
if(!result)
|
2024-02-14 19:09:32 +08:00
|
|
|
result = Curl_xfer_send(data, "\r\n", 2, &amount);
|
2014-10-24 04:56:35 +08:00
|
|
|
if(result) {
|
2010-08-12 22:55:48 +08:00
|
|
|
failf(data, "Failed sending Gopher request");
|
|
|
|
return result;
|
|
|
|
}
|
2021-01-09 00:58:15 +08:00
|
|
|
result = Curl_client_write(data, CLIENTWRITE_HEADER, (char *)"\r\n", 2);
|
2010-08-25 06:45:17 +08:00
|
|
|
if(result)
|
|
|
|
return result;
|
2010-08-24 05:30:59 +08:00
|
|
|
|
2024-02-14 19:09:32 +08:00
|
|
|
Curl_xfer_setup(data, FIRSTSOCKET, -1, FALSE, -1);
|
2010-08-12 22:55:48 +08:00
|
|
|
return CURLE_OK;
|
|
|
|
}
|
2022-10-31 00:38:16 +08:00
|
|
|
#endif /* CURL_DISABLE_GOPHER */
|