Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Elegant headers & params syntax #2

Merged
merged 2 commits into from
Oct 21, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 3 additions & 2 deletions docs/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -46,8 +46,9 @@ WITH __input AS (
'https://httpbin.org/delay/0',
headers => MAP {
'accept': 'application/json',
}::VARCHAR,
params => MAP {}::VARCHAR
},
params => MAP {
}
) AS data
),
__features AS (
Expand Down
42 changes: 24 additions & 18 deletions src/http_client_extension.cpp
Original file line number Diff line number Diff line change
@@ -1,6 +1,8 @@
#define DUCKDB_EXTENSION_MAIN
#include "http_client_extension.hpp"
#include "duckdb.hpp"
#include "duckdb/common/types.hpp"
#include "duckdb/common/vector_operations/generic_executor.hpp"
#include "duckdb/function/scalar_function.hpp"
#include "duckdb/main/extension_util.hpp"
#include "duckdb/common/atomic.hpp"
Expand Down Expand Up @@ -118,14 +120,18 @@ static void HTTPGetRequestFunction(DataChunk &args, ExpressionState &state, Vect
static void HTTPPostRequestFunction(DataChunk &args, ExpressionState &state, Vector &result) {
D_ASSERT(args.data.size() == 3);

using STRING_TYPE = PrimitiveType<string_t>;
using LENTRY_TYPE = PrimitiveType<list_entry_t>;

auto &url_vector = args.data[0];
auto &headers_vector = args.data[1];
auto &headers_entry = ListVector::GetEntry(headers_vector);
auto &body_vector = args.data[2];

TernaryExecutor::Execute<string_t, string_t, string_t, string_t>(
GenericExecutor::ExecuteTernary<STRING_TYPE, LENTRY_TYPE, STRING_TYPE, STRING_TYPE>(
url_vector, headers_vector, body_vector, result, args.size(),
[&](string_t url, string_t headers, string_t body) {
std::string url_str = url.GetString();
[&](STRING_TYPE url, LENTRY_TYPE headers, STRING_TYPE body) {
std::string url_str = url.val.GetString();

// Use helper to setup client and parse URL
auto client_and_path = SetupHttpClient(url_str);
Expand All @@ -134,24 +140,24 @@ static void HTTPPostRequestFunction(DataChunk &args, ExpressionState &state, Vec

// Prepare headers
duckdb_httplib_openssl::Headers header_map;
std::istringstream header_stream(headers.GetString());
std::string header;
while (std::getline(header_stream, header)) {
size_t colon_pos = header.find(':');
if (colon_pos != std::string::npos) {
std::string key = header.substr(0, colon_pos);
std::string value = header.substr(colon_pos + 1);
// Trim leading and trailing whitespace
key.erase(0, key.find_first_not_of(" \t"));
key.erase(key.find_last_not_of(" \t") + 1);
value.erase(0, value.find_first_not_of(" \t"));
value.erase(value.find_last_not_of(" \t") + 1);
header_map.emplace(key, value);
auto header_list = headers.val;
for (idx_t i = header_list.offset; i < header_list.offset + header_list.length; i++) {
const auto &child_value = headers_entry.GetValue(i);

Vector tmp(child_value);
auto &children = StructVector::GetEntries(tmp);

if (children.size() == 2) {
auto name = FlatVector::GetData<string_t>(*children[0]);
auto data = FlatVector::GetData<string_t>(*children[1]);
std::string key = name->GetString();
std::string val = data->GetString();
header_map.emplace(key, val);
}
}

// Make the POST request with headers and body
auto res = client.Post(path.c_str(), header_map, body.GetString(), "application/json");
auto res = client.Post(path.c_str(), header_map, body.val.GetString(), "application/json");
if (res) {
if (res->status == 200) {
return StringVector::AddString(result, res->body);
Expand All @@ -175,7 +181,7 @@ static void LoadInternal(DatabaseInstance &instance) {

ScalarFunctionSet http_post("http_post");
http_post.AddFunction(ScalarFunction(
{LogicalType::VARCHAR, LogicalType::VARCHAR, LogicalType::VARCHAR},
{LogicalType::VARCHAR, LogicalType::MAP(LogicalType::VARCHAR, LogicalType::VARCHAR), LogicalType::JSON()},
LogicalType::VARCHAR, HTTPPostRequestFunction));
ExtensionUtil::RegisterFunction(instance, http_post);
}
Expand Down
39 changes: 37 additions & 2 deletions test/sql/httpclient.test
Original file line number Diff line number Diff line change
Expand Up @@ -44,8 +44,9 @@ WITH __input AS (
'https://httpbin.org/delay/0',
headers => MAP {
'accept': 'application/json',
}::VARCHAR,
params => MAP {}::VARCHAR
},
params => MAP {
}
) AS data
),
__features AS (
Expand All @@ -62,3 +63,37 @@ WITH __input AS (
;
----
httpbin.org

# Confirm the POST extension works with headers and params
query I
WITH __input AS (
SELECT
http_post(
'https://earth-search.aws.element84.com/v0/search',
headers => MAP {
'Content-Type': 'application/json',
'Accept-Encoding': 'gzip',
'Accept': 'application/geo+json'
},
params => {
'collections': ['sentinel-s2-l2a-cogs'],
'ids': ['S2A_56LPN_20210930_0_L2A'],
'datetime': '2021-09-30/2021-09-30',
'limit': 10
}
) AS data
),
__features AS (
SELECT
unnest( from_json((data::JSON)->'features', '["json"]') )
AS features
FROM
__input
)
SELECT
features->>'id' AS id
FROM
__features
;
----
S2A_56LPN_20210930_0_L2A
Loading