mirror of
https://github.com/ceph/ceph-csi.git
synced 2024-12-29 08:20:20 +00:00
290beb4dda
Linux kernel 4.17.0 adds support for quota with CephFS. Without quota, it is not possible to fullfill the requirements of the CSI Spec and guarantee sufficient space on the filesystem for a volume. With this in mind, usage of the kernel client is only allowed with kernel 4.17.0 or newer. However, some Linux vendors backport features and patches to their Enterprise products. These kernels may have an older version, but do support quota. One of these is the kernel that comes with RHEL-7.7. By comparing the current running version of the Linux kernel against known versions that support quota, we can now automatically decide to use the kernel client, or not. Note that this does not change the 'forcekernelclient' parameter. The parameter is still available and can be used for kernels that are not in the 'known to support quota list'. Or users can pass the parameter to use a CephFS kernel client that does not support quota. Signed-off-by: Niels de Vos <ndevos@redhat.com> Signed-off-by: Madhu Rajanna <madhupr007@gmail.com>
347 lines
9.6 KiB
Go
347 lines
9.6 KiB
Go
/*
|
|
Copyright 2018 The Ceph-CSI Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
*/
|
|
|
|
package cephfs
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"os"
|
|
"os/exec"
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
"sync"
|
|
|
|
"github.com/ceph/ceph-csi/pkg/util"
|
|
|
|
"golang.org/x/sys/unix"
|
|
"k8s.io/klog"
|
|
)
|
|
|
|
const (
|
|
volumeMounterFuse = "fuse"
|
|
volumeMounterKernel = "kernel"
|
|
)
|
|
|
|
var (
|
|
availableMounters []string
|
|
|
|
// maps a mountpoint to PID of its FUSE daemon
|
|
fusePidMap = make(map[string]int)
|
|
fusePidMapMtx sync.Mutex
|
|
|
|
fusePidRx = regexp.MustCompile(`(?m)^ceph-fuse\[(.+)\]: starting fuse$`)
|
|
)
|
|
|
|
// Version checking the running kernel and comparing it to known versions that
|
|
// have support for quota. Distributors of enterprise Linux have backported
|
|
// quota support to previous versions. This function checks if the running
|
|
// kernel is one of the versions that have the feature/fixes backported.
|
|
//
|
|
// `uname -r` (or Uname().Utsname.Release has a format like 1.2.3-rc.vendor
|
|
// This can be slit up in the following components:
|
|
// - version (1)
|
|
// - patchlevel (2)
|
|
// - sublevel (3) - optional, defaults to 0
|
|
// - extraversion (rc) - optional, matching integers only
|
|
// - distribution (.vendor) - optional, match against whole `uname -r` string
|
|
//
|
|
// For matching multiple versions, the kernelSupport type contains a backport
|
|
// bool, which will cause matching
|
|
// version+patchlevel+sublevel+(>=extraversion)+(~distribution)
|
|
//
|
|
// In case the backport bool is false, a simple check for higher versions than
|
|
// version+patchlevel+sublevel is done.
|
|
func kernelSupportsQuota(release string) bool {
|
|
type kernelSupport struct {
|
|
version int
|
|
patchlevel int
|
|
sublevel int
|
|
extraversion int // prefix of the part after the first "-"
|
|
distribution string // component of full extraversion
|
|
backport bool // backports have a fixed version/patchlevel/sublevel
|
|
}
|
|
|
|
quotaSupport := []kernelSupport{
|
|
{4, 17, 0, 0, "", false}, // standard 4.17+ versions
|
|
{3, 10, 0, 1062, ".el7", true}, // RHEL-7.7
|
|
}
|
|
|
|
vers := strings.Split(strings.SplitN(release, "-", 2)[0], ".")
|
|
version, err := strconv.Atoi(vers[0])
|
|
if err != nil {
|
|
klog.Errorf("failed to parse version from %s: %v", release, err)
|
|
return false
|
|
}
|
|
patchlevel, err := strconv.Atoi(vers[1])
|
|
if err != nil {
|
|
klog.Errorf("failed to parse patchlevel from %s: %v", release, err)
|
|
return false
|
|
}
|
|
sublevel := 0
|
|
if len(vers) >= 3 {
|
|
sublevel, err = strconv.Atoi(vers[2])
|
|
if err != nil {
|
|
klog.Errorf("failed to parse sublevel from %s: %v", release, err)
|
|
return false
|
|
}
|
|
}
|
|
extra := strings.SplitN(release, "-", 2)
|
|
extraversion := 0
|
|
if len(extra) == 2 {
|
|
// ignore errors, 1st component of extraversion does not need to be an int
|
|
extraversion, err = strconv.Atoi(strings.Split(extra[1], ".")[0])
|
|
if err != nil {
|
|
// "go lint" wants err to be checked...
|
|
extraversion = 0
|
|
}
|
|
}
|
|
|
|
// compare running kernel against known versions
|
|
for _, kernel := range quotaSupport {
|
|
if !kernel.backport {
|
|
// deal with the default case(s), find >= match for version, patchlevel, sublevel
|
|
if version > kernel.version || (version == kernel.version && patchlevel > kernel.patchlevel) ||
|
|
(version == kernel.version && patchlevel == kernel.patchlevel && sublevel >= kernel.sublevel) {
|
|
return true
|
|
}
|
|
} else {
|
|
// specific backport, match distribution initially
|
|
if !strings.Contains(release, kernel.distribution) {
|
|
continue
|
|
}
|
|
|
|
// strict match version, patchlevel, sublevel, and >= match extraversion
|
|
if version == kernel.version && patchlevel == kernel.patchlevel &&
|
|
sublevel == kernel.sublevel && extraversion >= kernel.extraversion {
|
|
return true
|
|
}
|
|
}
|
|
}
|
|
klog.Errorf("kernel %s does not support quota", release)
|
|
return false
|
|
}
|
|
|
|
// Load available ceph mounters installed on system into availableMounters
|
|
// Called from driver.go's Run()
|
|
func loadAvailableMounters(conf *util.Config) error {
|
|
// #nosec
|
|
fuseMounterProbe := exec.Command("ceph-fuse", "--version")
|
|
// #nosec
|
|
kernelMounterProbe := exec.Command("mount.ceph")
|
|
|
|
err := kernelMounterProbe.Run()
|
|
if err == nil {
|
|
// fetch the current running kernel info
|
|
utsname := unix.Utsname{}
|
|
err := unix.Uname(&utsname)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
release := string(utsname.Release[:64])
|
|
|
|
if conf.ForceKernelCephFS || kernelSupportsQuota(release) {
|
|
klog.Infof("loaded mounter: %s", volumeMounterKernel)
|
|
availableMounters = append(availableMounters, volumeMounterKernel)
|
|
} else {
|
|
klog.Infof("kernel version < 4.17 might not support quota feature, hence not loading kernel client")
|
|
}
|
|
}
|
|
|
|
if fuseMounterProbe.Run() == nil {
|
|
klog.Infof("loaded mounter: %s", volumeMounterFuse)
|
|
availableMounters = append(availableMounters, volumeMounterFuse)
|
|
}
|
|
|
|
if len(availableMounters) == 0 {
|
|
return errors.New("no ceph mounters found on system")
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
type volumeMounter interface {
|
|
mount(ctx context.Context, mountPoint string, cr *util.Credentials, volOptions *volumeOptions) error
|
|
name() string
|
|
}
|
|
|
|
func newMounter(volOptions *volumeOptions) (volumeMounter, error) {
|
|
// Get the mounter from the configuration
|
|
|
|
wantMounter := volOptions.Mounter
|
|
|
|
// Verify that it's available
|
|
|
|
var chosenMounter string
|
|
|
|
for _, availMounter := range availableMounters {
|
|
if availMounter == wantMounter {
|
|
chosenMounter = wantMounter
|
|
break
|
|
}
|
|
}
|
|
|
|
if chosenMounter == "" {
|
|
// Otherwise pick whatever is left
|
|
chosenMounter = availableMounters[0]
|
|
klog.Infof("requested mounter: %s, chosen mounter: %s", wantMounter, chosenMounter)
|
|
}
|
|
|
|
// Create the mounter
|
|
|
|
switch chosenMounter {
|
|
case volumeMounterFuse:
|
|
return &fuseMounter{}, nil
|
|
case volumeMounterKernel:
|
|
return &kernelMounter{}, nil
|
|
}
|
|
|
|
return nil, fmt.Errorf("unknown mounter '%s'", chosenMounter)
|
|
}
|
|
|
|
type fuseMounter struct{}
|
|
|
|
func mountFuse(ctx context.Context, mountPoint string, cr *util.Credentials, volOptions *volumeOptions) error {
|
|
args := []string{
|
|
mountPoint,
|
|
"-m", volOptions.Monitors,
|
|
"-c", util.CephConfigPath,
|
|
"-n", cephEntityClientPrefix + cr.ID, "--keyfile=" + cr.KeyFile,
|
|
"-r", volOptions.RootPath,
|
|
"-o", "nonempty",
|
|
}
|
|
|
|
if volOptions.FuseMountOptions != "" {
|
|
args = append(args, ","+volOptions.FuseMountOptions)
|
|
}
|
|
if volOptions.FsName != "" {
|
|
args = append(args, "--client_mds_namespace="+volOptions.FsName)
|
|
}
|
|
|
|
_, stderr, err := execCommand(ctx, "ceph-fuse", args[:]...)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Parse the output:
|
|
// We need "starting fuse" meaning the mount is ok
|
|
// and PID of the ceph-fuse daemon for unmount
|
|
|
|
match := fusePidRx.FindSubmatch(stderr)
|
|
if len(match) != 2 {
|
|
return fmt.Errorf("ceph-fuse failed: %s", stderr)
|
|
}
|
|
|
|
pid, err := strconv.Atoi(string(match[1]))
|
|
if err != nil {
|
|
return fmt.Errorf("failed to parse FUSE daemon PID: %v", err)
|
|
}
|
|
|
|
fusePidMapMtx.Lock()
|
|
fusePidMap[mountPoint] = pid
|
|
fusePidMapMtx.Unlock()
|
|
|
|
return nil
|
|
}
|
|
|
|
func (m *fuseMounter) mount(ctx context.Context, mountPoint string, cr *util.Credentials, volOptions *volumeOptions) error {
|
|
if err := util.CreateMountPoint(mountPoint); err != nil {
|
|
return err
|
|
}
|
|
|
|
return mountFuse(ctx, mountPoint, cr, volOptions)
|
|
}
|
|
|
|
func (m *fuseMounter) name() string { return "Ceph FUSE driver" }
|
|
|
|
type kernelMounter struct{}
|
|
|
|
func mountKernel(ctx context.Context, mountPoint string, cr *util.Credentials, volOptions *volumeOptions) error {
|
|
if err := execCommandErr(ctx, "modprobe", "ceph"); err != nil {
|
|
return err
|
|
}
|
|
|
|
args := []string{
|
|
"-t", "ceph",
|
|
fmt.Sprintf("%s:%s", volOptions.Monitors, volOptions.RootPath),
|
|
mountPoint,
|
|
}
|
|
optionsStr := fmt.Sprintf("name=%s,secretfile=%s", cr.ID, cr.KeyFile)
|
|
if volOptions.FsName != "" {
|
|
optionsStr += fmt.Sprintf(",mds_namespace=%s", volOptions.FsName)
|
|
}
|
|
if volOptions.KernelMountOptions != "" {
|
|
optionsStr += fmt.Sprintf(",%s", volOptions.KernelMountOptions)
|
|
}
|
|
args = append(args, "-o", optionsStr)
|
|
|
|
return execCommandErr(ctx, "mount", args[:]...)
|
|
}
|
|
|
|
func (m *kernelMounter) mount(ctx context.Context, mountPoint string, cr *util.Credentials, volOptions *volumeOptions) error {
|
|
if err := util.CreateMountPoint(mountPoint); err != nil {
|
|
return err
|
|
}
|
|
|
|
return mountKernel(ctx, mountPoint, cr, volOptions)
|
|
}
|
|
|
|
func (m *kernelMounter) name() string { return "Ceph kernel client" }
|
|
|
|
func bindMount(ctx context.Context, from, to string, readOnly bool, mntOptions []string) error {
|
|
mntOptionSli := strings.Join(mntOptions, ",")
|
|
if err := execCommandErr(ctx, "mount", "-o", mntOptionSli, from, to); err != nil {
|
|
return fmt.Errorf("failed to bind-mount %s to %s: %v", from, to, err)
|
|
}
|
|
|
|
if readOnly {
|
|
mntOptionSli += ",remount"
|
|
if err := execCommandErr(ctx, "mount", "-o", mntOptionSli, to); err != nil {
|
|
return fmt.Errorf("failed read-only remount of %s: %v", to, err)
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func unmountVolume(ctx context.Context, mountPoint string) error {
|
|
if err := execCommandErr(ctx, "umount", mountPoint); err != nil {
|
|
return err
|
|
}
|
|
|
|
fusePidMapMtx.Lock()
|
|
pid, ok := fusePidMap[mountPoint]
|
|
if ok {
|
|
delete(fusePidMap, mountPoint)
|
|
}
|
|
fusePidMapMtx.Unlock()
|
|
|
|
if ok {
|
|
p, err := os.FindProcess(pid)
|
|
if err != nil {
|
|
klog.Warningf(util.Log(ctx, "failed to find process %d: %v"), pid, err)
|
|
} else {
|
|
if _, err = p.Wait(); err != nil {
|
|
klog.Warningf(util.Log(ctx, "%d is not a child process: %v"), pid, err)
|
|
}
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|