Skip to content

Commit a95d661

Browse files
authored
Add UDTF that detects linux kernel header installation and add column to GetAgentStatus (#2052)
Summary: Add UDTF that detects linux kernel header installation and add column to `GetAgentStatus` This is a prerequisite to accomplish #2051. The `px deploy` command uses the GetAgentStatus UDTF in its final [healthcheck step](https://github.com/pixie-io/pixie/blob/854062111cf4b91a40649a2e2647c88c0a68b0db/src/pixie_cli/pkg/cmd/deploy.go#L607-L613). With this kernel header detection in place, the `px` cli can use the results from the `px/agent_status` script to print a warning message if kernel headers aren't detected. The helm install flow needs to be covered as well. My hope is that this UDTF could be used for that use case as well, but I need to further investigate the details of that. Relevant Issues: #2051 Type of change: /kind feature Test Plan: Skaffolded to a Ubuntu GKE cluster and tested the following - [x] Kelvin always reports `false` as it doesn't bind mount `/` to `/host` - [x] PEM running on host without `linux-headers-$(uname -r)` package reports `false` - [x] PEM running on host with `linux-headers-$(uname -r)` package reports `true` ``` $ gcloud compute ssh gke-dev-cluster-ddelnano-default-pool-a27c1ac2-x5k2 --internal-ip -- 'ls -alh /lib/modules/$(uname -r)/build' lrwxrwxrwx 1 root root 38 Aug 9 15:25 /lib/modules/5.15.0-1065-gke/build -> /usr/src/linux-headers-5.15.0-1065-gke $ gcloud compute ssh gke-dev-cluster-ddelnano-default-pool-a27c1ac2-j6pg --internal-ip -- 'ls -alh /lib/modules/$(uname -r)/build' ls: cannot access '/lib/modules/5.15.0-1065-gke/build': No such file or directory ``` ![Screen Shot 2024-12-02 at 9 30 29 AM](https://github.com/user-attachments/assets/9fa862f8-5a6c-46d6-8899-bfaf2bdf3371) Changelog Message: Add `GetLinuxHeadersStatus` UDTF and add `kernel_headers_installed` column to `GetAgentStatus` --------- Signed-off-by: Dom Del Nano <[email protected]>
1 parent 672e351 commit a95d661

17 files changed

+353
-126
lines changed

src/common/system/kernel_version.h

+5
Original file line numberDiff line numberDiff line change
@@ -75,6 +75,11 @@ enum class KernelVersionOrder {
7575
kNewer,
7676
};
7777

78+
struct KernelInfo {
79+
KernelVersion version;
80+
bool kernel_headers_installed;
81+
};
82+
7883
// Compares two kernel versions and detect their relationship.
7984
KernelVersionOrder CompareKernelVersions(KernelVersion a, KernelVersion b);
8085

+78
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
/*
2+
* Copyright 2018- The Pixie Authors.
3+
*
4+
* Licensed under the Apache License, Version 2.0 (the "License");
5+
* you may not use this file except in compliance with the License.
6+
* You may obtain a copy of the License at
7+
*
8+
* http://www.apache.org/licenses/LICENSE-2.0
9+
*
10+
* Unless required by applicable law or agreed to in writing, software
11+
* distributed under the License is distributed on an "AS IS" BASIS,
12+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
* See the License for the specific language governing permissions and
14+
* limitations under the License.
15+
*
16+
* SPDX-License-Identifier: Apache-2.0
17+
*/
18+
19+
#include "src/common/system/linux_headers_utils.h"
20+
21+
#include <fstream>
22+
#include <limits>
23+
#include <memory>
24+
#include <string>
25+
26+
#include "src/common/base/file.h"
27+
#include "src/common/fs/fs_wrapper.h"
28+
#include "src/common/system/config.h"
29+
30+
namespace px {
31+
namespace system {
32+
33+
StatusOr<std::filesystem::path> ResolvePossibleSymlinkToHostPath(const std::filesystem::path p) {
34+
// Check if "p" is a symlink.
35+
std::error_code ec;
36+
const bool is_symlink = std::filesystem::is_symlink(p, ec);
37+
if (ec) {
38+
return error::NotFound(absl::Substitute("Did not find the host headers at path: $0, $1.",
39+
p.string(), ec.message()));
40+
}
41+
42+
if (!is_symlink) {
43+
// Not a symlink, we are good now.
44+
return p;
45+
}
46+
47+
// Resolve the symlink, and re-convert to a host path..
48+
const std::filesystem::path resolved = std::filesystem::read_symlink(p, ec);
49+
if (ec) {
50+
return error::Internal(ec.message());
51+
}
52+
53+
// Relative paths containing "../" can result in an invalid host mount path when using
54+
// ToHostPath. Therefore, we need to treat the absolute and relative cases differently.
55+
std::filesystem::path resolved_host_path;
56+
if (resolved.is_absolute()) {
57+
resolved_host_path = system::Config::GetInstance().ToHostPath(resolved);
58+
VLOG(1) << absl::Substitute(
59+
"Symlink target is an absolute path. Converting that to host path: $0 -> $1.",
60+
resolved.string(), resolved_host_path.string());
61+
} else {
62+
resolved_host_path = p.parent_path();
63+
resolved_host_path /= resolved.string();
64+
VLOG(1) << absl::Substitute(
65+
"Symlink target is a relative path. Concatenating it to parent directory: $0",
66+
resolved_host_path.string());
67+
}
68+
69+
// Downstream won't be ok unless the resolved host path exists; return an error if needed.
70+
if (!fs::Exists(resolved_host_path)) {
71+
return error::NotFound(absl::Substitute("Did not find host headers at resolved path: $0.",
72+
resolved_host_path.string()));
73+
}
74+
return resolved_host_path;
75+
}
76+
77+
} // namespace system
78+
} // namespace px
+46
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,46 @@
1+
/*
2+
* Copyright 2018- The Pixie Authors.
3+
*
4+
* Licensed under the Apache License, Version 2.0 (the "License");
5+
* you may not use this file except in compliance with the License.
6+
* You may obtain a copy of the License at
7+
*
8+
* http://www.apache.org/licenses/LICENSE-2.0
9+
*
10+
* Unless required by applicable law or agreed to in writing, software
11+
* distributed under the License is distributed on an "AS IS" BASIS,
12+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
* See the License for the specific language governing permissions and
14+
* limitations under the License.
15+
*
16+
* SPDX-License-Identifier: Apache-2.0
17+
*/
18+
19+
#pragma once
20+
21+
#include <filesystem>
22+
23+
#include "src/common/base/base.h"
24+
25+
namespace px {
26+
namespace system {
27+
28+
constexpr std::string_view kLinuxModulesDir = "/lib/modules/";
29+
30+
/**
31+
* Resolves a possible symlink path to its corresponding host filesystem path.
32+
*
33+
* This function takes a filesystem path and checks if it is a symbolic link. If it is,
34+
* the symlink is resolved to its target path. Depending on whether the target is an absolute
35+
* or relative path, it is further processed to convert it into a valid host path (as in
36+
* Config::ToHostPath(...) path).
37+
*
38+
* If the input path is not a symlink, it is returned as-is. The function ensures that
39+
* the final resolved path exists in the host filesystem before returning it. Errors are
40+
* returned when the path does not exist, the resolution fails, or when there is an issue
41+
* accessing the filesystem.
42+
*/
43+
StatusOr<std::filesystem::path> ResolvePossibleSymlinkToHostPath(const std::filesystem::path p);
44+
45+
} // namespace system
46+
} // namespace px

src/stirling/utils/linux_headers.cc

+6-47
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@
3131
#include "src/common/fs/temp_file.h"
3232
#include "src/common/minitar/minitar.h"
3333
#include "src/common/system/config.h"
34+
#include "src/common/system/linux_headers_utils.h"
3435
#include "src/common/system/proc_pid_path.h"
3536
#include "src/common/zlib/zlib_wrapper.h"
3637

@@ -83,7 +84,7 @@ StatusOr<std::filesystem::path> FindKernelConfig() {
8384
// Search for /boot/config-<uname>
8485
syscfg.ToHostPath(absl::StrCat("/boot/config-", uname)),
8586
// Search for /lib/modules/<uname>/config
86-
syscfg.ToHostPath(absl::StrCat("/lib/modules/", uname, "/config")),
87+
syscfg.ToHostPath(absl::StrCat(px::system::kLinuxModulesDir, uname, "/config")),
8788
// TODO(yzhao): https://github.com/lima-vm/alpine-lima/issues/67 once this issue is resolved,
8889
// we might consider change these 2 paths into something recommended by rancher-desktop.
8990
// The path used by `alpine-lima` in "Live CD" boot mechanism.
@@ -209,55 +210,12 @@ Status FindLinuxHeadersDirectory(const std::filesystem::path& lib_modules_dir) {
209210
return error::NotFound("Could not find 'source' or 'build' under $0.", lib_modules_dir.string());
210211
}
211212

212-
StatusOr<std::filesystem::path> ResolvePossibleSymlinkToHostPath(const std::filesystem::path p) {
213-
// Check if "p" is a symlink.
214-
std::error_code ec;
215-
const bool is_symlink = std::filesystem::is_symlink(p, ec);
216-
if (ec) {
217-
return error::NotFound(absl::Substitute("Did not find the host headers at path: $0, $1.",
218-
p.string(), ec.message()));
219-
}
220-
221-
if (!is_symlink) {
222-
// Not a symlink, we are good now.
223-
return p;
224-
}
225-
226-
// Resolve the symlink, and re-convert to a host path..
227-
const std::filesystem::path resolved = std::filesystem::read_symlink(p, ec);
228-
if (ec) {
229-
return error::Internal(ec.message());
230-
}
231-
232-
// Relative paths containing "../" can result in an invalid host mount path when using
233-
// ToHostPath. Therefore, we need to treat the absolute and relative cases differently.
234-
std::filesystem::path resolved_host_path;
235-
if (resolved.is_absolute()) {
236-
resolved_host_path = system::Config::GetInstance().ToHostPath(resolved);
237-
VLOG(1) << absl::Substitute(
238-
"Symlink target is an absolute path. Converting that to host path: $0 -> $1.",
239-
resolved.string(), resolved_host_path.string());
240-
} else {
241-
resolved_host_path = p.parent_path();
242-
resolved_host_path /= resolved.string();
243-
VLOG(1) << absl::Substitute(
244-
"Symlink target is a relative path. Concatenating it to parent directory: $0",
245-
resolved_host_path.string());
246-
}
247-
248-
// Downstream won't be ok unless the resolved host path exists; return an error if needed.
249-
if (!fs::Exists(resolved_host_path)) {
250-
return error::NotFound(absl::Substitute("Did not find host headers at resolved path: $0.",
251-
resolved_host_path.string()));
252-
}
253-
return resolved_host_path;
254-
}
255-
256213
Status LinkHostLinuxHeadersKernel(const std::filesystem::path& lib_modules_dir) {
257214
const auto host_path = system::Config::GetInstance().ToHostPath(lib_modules_dir);
258215
LOG(INFO) << absl::Substitute("Looking for host Linux headers at $0.", host_path.string());
259216

260-
PX_ASSIGN_OR_RETURN(const auto resolved_host_path, ResolvePossibleSymlinkToHostPath(host_path));
217+
PX_ASSIGN_OR_RETURN(const auto resolved_host_path,
218+
system::ResolvePossibleSymlinkToHostPath(host_path));
261219
PX_RETURN_IF_ERROR(fs::CreateSymlinkIfNotExists(resolved_host_path, lib_modules_dir));
262220
LOG(INFO) << absl::Substitute("Linked host headers at $0 to symlink in pem namespace at $1.",
263221
resolved_host_path.string(), lib_modules_dir.string());
@@ -401,7 +359,8 @@ Status FindOrInstallLinuxHeaders() {
401359
// However we find Linux headers (below) we link them into the mount namespace of this
402360
// process using one (or both) of the above paths.
403361

404-
const std::filesystem::path pem_ns_lib_modules_dir = "/lib/modules/" + uname;
362+
const std::filesystem::path pem_ns_lib_modules_dir =
363+
std::string(px::system::kLinuxModulesDir) + uname;
405364

406365
// Create (or verify existence); does nothing if the directory already exists.
407366
PX_RETURN_IF_ERROR(fs::CreateDirectories(pem_ns_lib_modules_dir));

src/vizier/funcs/md_udtfs/md_udtfs.cc

+2
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,8 @@ void RegisterFuncsOrDie(const VizierFuncFactoryContext& ctx, carnot::udf::Regist
3737
registry->RegisterFactoryOrDie<GetProfilerSamplingPeriodMS,
3838
UDTFWithMDFactory<GetProfilerSamplingPeriodMS>>(
3939
"GetProfilerSamplingPeriodMS", ctx);
40+
registry->RegisterFactoryOrDie<GetLinuxHeadersStatus, UDTFWithMDFactory<GetLinuxHeadersStatus>>(
41+
"GetLinuxHeadersStatus", ctx);
4042

4143
registry->RegisterOrDie<GetDebugMDState>("_DebugMDState");
4244
registry->RegisterFactoryOrDie<GetDebugMDWithPrefix, UDTFWithMDFactory<GetDebugMDWithPrefix>>(

src/vizier/funcs/md_udtfs/md_udtfs_impl.h

+63-1
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,10 @@ namespace px {
4343
namespace vizier {
4444
namespace funcs {
4545
namespace md {
46+
47+
constexpr std::string_view kKernelHeadersInstalledDesc =
48+
"Whether the agent had linux headers pre-installed";
49+
4650
template <typename TUDTF>
4751
class UDTFWithMDFactory : public carnot::udf::UDTFFactory {
4852
public:
@@ -295,7 +299,9 @@ class GetAgentStatus final : public carnot::udf::UDTF<GetAgentStatus> {
295299
ColInfo("create_time", types::DataType::TIME64NS, types::PatternType::GENERAL,
296300
"The creation time of the agent"),
297301
ColInfo("last_heartbeat_ns", types::DataType::INT64, types::PatternType::GENERAL,
298-
"Time (in nanoseconds) since the last heartbeat"));
302+
"Time (in nanoseconds) since the last heartbeat"),
303+
ColInfo("kernel_headers_installed", types::DataType::BOOLEAN, types::PatternType::GENERAL,
304+
kKernelHeadersInstalledDesc));
299305
}
300306

301307
Status Init(FunctionContext*) {
@@ -330,6 +336,8 @@ class GetAgentStatus final : public carnot::udf::UDTF<GetAgentStatus> {
330336
rw->Append<IndexOf("agent_state")>(StringValue(magic_enum::enum_name(agent_status.state())));
331337
rw->Append<IndexOf("create_time")>(agent_info.create_time_ns());
332338
rw->Append<IndexOf("last_heartbeat_ns")>(agent_status.ns_since_last_heartbeat());
339+
rw->Append<IndexOf("kernel_headers_installed")>(
340+
agent_info.info().host_info().kernel_headers_installed());
333341

334342
++idx_;
335343
return idx_ < resp_->info_size();
@@ -396,6 +404,60 @@ class GetProfilerSamplingPeriodMS final : public carnot::udf::UDTF<GetProfilerSa
396404
std::function<void(grpc::ClientContext*)> add_context_authentication_func_;
397405
};
398406

407+
/**
408+
* This UDTF retrieves the status of the agents' Linux headers installation.
409+
*/
410+
class GetLinuxHeadersStatus final : public carnot::udf::UDTF<GetLinuxHeadersStatus> {
411+
public:
412+
using MDSStub = vizier::services::metadata::MetadataService::Stub;
413+
using SchemaResponse = vizier::services::metadata::SchemaResponse;
414+
GetLinuxHeadersStatus() = delete;
415+
GetLinuxHeadersStatus(std::shared_ptr<MDSStub> stub,
416+
std::function<void(grpc::ClientContext*)> add_context_authentication)
417+
: idx_(0), stub_(stub), add_context_authentication_func_(add_context_authentication) {}
418+
419+
static constexpr auto Executor() { return carnot::udfspb::UDTFSourceExecutor::UDTF_ONE_KELVIN; }
420+
421+
static constexpr auto OutputRelation() {
422+
return MakeArray(
423+
ColInfo("asid", types::DataType::INT64, types::PatternType::GENERAL, "The Agent Short ID"),
424+
ColInfo("kernel_headers_installed", types::DataType::BOOLEAN, types::PatternType::GENERAL,
425+
kKernelHeadersInstalledDesc));
426+
}
427+
428+
Status Init(FunctionContext*) {
429+
px::vizier::services::metadata::AgentInfoRequest req;
430+
resp_ = std::make_unique<px::vizier::services::metadata::AgentInfoResponse>();
431+
432+
grpc::ClientContext ctx;
433+
add_context_authentication_func_(&ctx);
434+
auto s = stub_->GetAgentInfo(&ctx, req, resp_.get());
435+
if (!s.ok()) {
436+
return error::Internal("Failed to make RPC call to GetAgentInfo");
437+
}
438+
return Status::OK();
439+
}
440+
441+
bool NextRecord(FunctionContext*, RecordWriter* rw) {
442+
const auto& agent_metadata = resp_->info(idx_);
443+
const auto& agent_info = agent_metadata.agent();
444+
445+
const auto asid = agent_info.asid();
446+
const auto kernel_headers_installed = agent_info.info().host_info().kernel_headers_installed();
447+
rw->Append<IndexOf("asid")>(asid);
448+
rw->Append<IndexOf("kernel_headers_installed")>(kernel_headers_installed);
449+
450+
++idx_;
451+
return idx_ < resp_->info_size();
452+
}
453+
454+
private:
455+
int idx_ = 0;
456+
std::unique_ptr<px::vizier::services::metadata::AgentInfoResponse> resp_;
457+
std::shared_ptr<MDSStub> stub_;
458+
std::function<void(grpc::ClientContext*)> add_context_authentication_func_;
459+
};
460+
399461
namespace internal {
400462
inline rapidjson::GenericStringRef<char> StringRef(std::string_view s) {
401463
return rapidjson::GenericStringRef<char>(s.data(), s.size());

src/vizier/services/agent/kelvin/kelvin_main.cc

+5-1
Original file line numberDiff line numberDiff line change
@@ -91,8 +91,12 @@ int main(int argc, char** argv) {
9191
LOG(INFO) << absl::Substitute("Pixie Kelvin. Version: $0, id: $1, kernel: $2",
9292
px::VersionInfo::VersionString(), agent_id.str(),
9393
kernel_version.ToString());
94+
auto kernel_info = px::system::KernelInfo{
95+
kernel_version,
96+
false /* kernel_headers_installed */,
97+
};
9498
auto manager = KelvinManager::Create(agent_id, FLAGS_pod_name, FLAGS_host_ip, addr,
95-
FLAGS_rpc_port, FLAGS_nats_url, mds_addr, kernel_version)
99+
FLAGS_rpc_port, FLAGS_nats_url, mds_addr, kernel_info)
96100
.ConsumeValueOrDie();
97101

98102
TerminationHandler::set_manager(manager.get());

src/vizier/services/agent/kelvin/kelvin_manager.h

+2-2
Original file line numberDiff line numberDiff line change
@@ -44,9 +44,9 @@ class KelvinManager : public Manager {
4444
KelvinManager() = delete;
4545
KelvinManager(sole::uuid agent_id, std::string_view pod_name, std::string_view host_ip,
4646
std::string_view addr, int grpc_server_port, std::string_view nats_url,
47-
std::string_view mds_url, system::KernelVersion kernel_version)
47+
std::string_view mds_url, system::KernelInfo kernel_info)
4848
: Manager(agent_id, pod_name, host_ip, grpc_server_port, KelvinManager::Capabilities(),
49-
KelvinManager::Parameters(), nats_url, mds_url, kernel_version) {
49+
KelvinManager::Parameters(), nats_url, mds_url, kernel_info) {
5050
info()->address = std::string(addr);
5151
}
5252

src/vizier/services/agent/pem/pem_main.cc

+17-1
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@
2525
#include "src/common/base/base.h"
2626
#include "src/common/signal/signal.h"
2727
#include "src/common/system/kernel_version.h"
28+
#include "src/common/system/linux_headers_utils.h"
2829
#include "src/shared/version/version.h"
2930

3031
DEFINE_string(nats_url, gflags::StringFromEnv("PL_NATS_URL", "pl-nats"),
@@ -68,8 +69,23 @@ int main(int argc, char** argv) {
6869
LOG(INFO) << absl::Substitute("Pixie PEM. Version: $0, id: $1, kernel version: $2",
6970
px::VersionInfo::VersionString(), agent_id.str(),
7071
kernel_version.ToString());
72+
73+
auto kernel_headers_installed = false;
74+
auto uname = px::system::GetUname();
75+
if (uname.ok()) {
76+
const auto host_path = px::system::Config::GetInstance().ToHostPath(
77+
absl::StrCat(px::system::kLinuxModulesDir, uname.ConsumeValueOrDie(), "/build"));
78+
79+
const auto resolved_host_path = px::system::ResolvePossibleSymlinkToHostPath(host_path);
80+
kernel_headers_installed = resolved_host_path.ok();
81+
}
82+
83+
auto kernel_info = px::system::KernelInfo{
84+
kernel_version,
85+
kernel_headers_installed,
86+
};
7187
auto manager =
72-
PEMManager::Create(agent_id, FLAGS_pod_name, FLAGS_host_ip, FLAGS_nats_url, kernel_version)
88+
PEMManager::Create(agent_id, FLAGS_pod_name, FLAGS_host_ip, FLAGS_nats_url, kernel_info)
7389
.ConsumeValueOrDie();
7490

7591
TerminationHandler::set_manager(manager.get());

0 commit comments

Comments
 (0)