/* Copyright 2019 The Kubernetes Authors. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ package plugins import ( "fmt" "strconv" "strings" v1 "k8s.io/api/core/v1" storage "k8s.io/api/storage/v1" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/apimachinery/pkg/util/sets" ) const ( // GCEPDDriverName is the name of the CSI driver for GCE PD GCEPDDriverName = "pd.csi.storage.gke.io" // GCEPDInTreePluginName is the name of the intree plugin for GCE PD GCEPDInTreePluginName = "kubernetes.io/gce-pd" // GCEPDTopologyKey is the zonal topology key for GCE PD CSI Driver GCEPDTopologyKey = "topology.gke.io/zone" // Volume ID Expected Format // "projects/{projectName}/zones/{zoneName}/disks/{diskName}" volIDZonalFmt = "projects/%s/zones/%s/disks/%s" // "projects/{projectName}/regions/{regionName}/disks/{diskName}" volIDRegionalFmt = "projects/%s/regions/%s/disks/%s" volIDProjectValue = 1 volIDRegionalityValue = 2 volIDZoneValue = 3 volIDDiskNameValue = 5 volIDTotalElements = 6 nodeIDFmt = "projects/%s/zones/%s/instances/%s" // UnspecifiedValue is used for an unknown zone string UnspecifiedValue = "UNSPECIFIED" ) var _ InTreePlugin = &gcePersistentDiskCSITranslator{} // gcePersistentDiskCSITranslator handles translation of PV spec from In-tree // GCE PD to CSI GCE PD and vice versa type gcePersistentDiskCSITranslator struct{} // NewGCEPersistentDiskCSITranslator returns a new instance of gcePersistentDiskTranslator func NewGCEPersistentDiskCSITranslator() InTreePlugin { return &gcePersistentDiskCSITranslator{} } func generateToplogySelectors(key string, values []string) []v1.TopologySelectorTerm { return []v1.TopologySelectorTerm{ { MatchLabelExpressions: []v1.TopologySelectorLabelRequirement{ { Key: key, Values: values, }, }, }, } } // TranslateInTreeStorageClassParametersToCSI translates InTree GCE storage class parameters to CSI storage class func (g *gcePersistentDiskCSITranslator) TranslateInTreeStorageClassToCSI(sc *storage.StorageClass) (*storage.StorageClass, error) { var generatedTopologies []v1.TopologySelectorTerm np := map[string]string{} for k, v := range sc.Parameters { switch strings.ToLower(k) { case fsTypeKey: // prefixed fstype parameter is stripped out by external provisioner np[csiFsTypeKey] = v // Strip out zone and zones parameters and translate them into topologies instead case zoneKey: generatedTopologies = generateToplogySelectors(GCEPDTopologyKey, []string{v}) case zonesKey: generatedTopologies = generateToplogySelectors(GCEPDTopologyKey, strings.Split(v, ",")) default: np[k] = v } } if len(generatedTopologies) > 0 && len(sc.AllowedTopologies) > 0 { return nil, fmt.Errorf("cannot simultaneously set allowed topologies and zone/zones parameters") } else if len(generatedTopologies) > 0 { sc.AllowedTopologies = generatedTopologies } else if len(sc.AllowedTopologies) > 0 { newTopologies, err := translateAllowedTopologies(sc.AllowedTopologies, GCEPDTopologyKey) if err != nil { return nil, fmt.Errorf("failed translating allowed topologies: %v", err) } sc.AllowedTopologies = newTopologies } sc.Parameters = np return sc, nil } // backwardCompatibleAccessModes translates all instances of ReadWriteMany // access mode from the in-tree plugin to ReadWriteOnce. This is because in-tree // plugin never supported ReadWriteMany but also did not validate or enforce // this access mode for pre-provisioned volumes. The GCE PD CSI Driver validates // and enforces (fails) ReadWriteMany. Therefore we treat all in-tree // ReadWriteMany as ReadWriteOnce volumes to not break legacy volumes. It also // takes [ReadWriteOnce, ReadOnlyMany] and makes it ReadWriteOnce. This is // because the in-tree plugin does not enforce access modes and just attaches // the disk in ReadWriteOnce mode; however, the CSI external-attacher will fail // this combination because technically [ReadWriteOnce, ReadOnlyMany] is not // supportable on an attached volume // See: https://github.com/kubernetes-csi/external-attacher/issues/153 func backwardCompatibleAccessModes(ams []v1.PersistentVolumeAccessMode) []v1.PersistentVolumeAccessMode { if ams == nil { return nil } s := map[v1.PersistentVolumeAccessMode]bool{} var newAM []v1.PersistentVolumeAccessMode for _, am := range ams { if am == v1.ReadWriteMany { // ReadWriteMany is unsupported in CSI, but in-tree did no // validation and treated it as ReadWriteOnce s[v1.ReadWriteOnce] = true } else { s[am] = true } } switch { case s[v1.ReadOnlyMany] && s[v1.ReadWriteOnce]: // ROX,RWO is unsupported in CSI, but in-tree did not validation and // treated it as ReadWriteOnce newAM = []v1.PersistentVolumeAccessMode{v1.ReadWriteOnce} case s[v1.ReadWriteOnce]: newAM = []v1.PersistentVolumeAccessMode{v1.ReadWriteOnce} case s[v1.ReadOnlyMany]: newAM = []v1.PersistentVolumeAccessMode{v1.ReadOnlyMany} default: newAM = []v1.PersistentVolumeAccessMode{v1.ReadWriteOnce} } return newAM } // TranslateInTreeInlineVolumeToCSI takes a Volume with GCEPersistentDisk set from in-tree // and converts the GCEPersistentDisk source to a CSIPersistentVolumeSource func (g *gcePersistentDiskCSITranslator) TranslateInTreeInlineVolumeToCSI(volume *v1.Volume) (*v1.PersistentVolume, error) { if volume == nil || volume.GCEPersistentDisk == nil { return nil, fmt.Errorf("volume is nil or GCE PD not defined on volume") } pdSource := volume.GCEPersistentDisk partition := "" if pdSource.Partition != 0 { partition = strconv.Itoa(int(pdSource.Partition)) } var am v1.PersistentVolumeAccessMode if pdSource.ReadOnly { am = v1.ReadOnlyMany } else { am = v1.ReadWriteOnce } fsMode := v1.PersistentVolumeFilesystem return &v1.PersistentVolume{ ObjectMeta: metav1.ObjectMeta{ // Must be unique per disk as it is used as the unique part of the // staging path Name: fmt.Sprintf("%s-%s", GCEPDDriverName, pdSource.PDName), }, Spec: v1.PersistentVolumeSpec{ PersistentVolumeSource: v1.PersistentVolumeSource{ CSI: &v1.CSIPersistentVolumeSource{ Driver: GCEPDDriverName, VolumeHandle: fmt.Sprintf(volIDZonalFmt, UnspecifiedValue, UnspecifiedValue, pdSource.PDName), ReadOnly: pdSource.ReadOnly, FSType: pdSource.FSType, VolumeAttributes: map[string]string{ "partition": partition, }, }, }, AccessModes: []v1.PersistentVolumeAccessMode{am}, VolumeMode: &fsMode, }, }, nil } // TranslateInTreePVToCSI takes a PV with GCEPersistentDisk set from in-tree // and converts the GCEPersistentDisk source to a CSIPersistentVolumeSource func (g *gcePersistentDiskCSITranslator) TranslateInTreePVToCSI(pv *v1.PersistentVolume) (*v1.PersistentVolume, error) { var volID string if pv == nil || pv.Spec.GCEPersistentDisk == nil { return nil, fmt.Errorf("pv is nil or GCE Persistent Disk source not defined on pv") } // depend on which version it migrates from, the label could be failuredomain beta or topology GA version zonesLabel := pv.Labels[v1.LabelFailureDomainBetaZone] if zonesLabel == "" { zonesLabel = pv.Labels[v1.LabelTopologyZone] } zones := strings.Split(zonesLabel, labelMultiZoneDelimiter) if len(zones) == 1 && len(zones[0]) != 0 { // Zonal volID = fmt.Sprintf(volIDZonalFmt, UnspecifiedValue, zones[0], pv.Spec.GCEPersistentDisk.PDName) } else if len(zones) > 1 { // Regional region, err := gceGetRegionFromZones(zones) if err != nil { return nil, fmt.Errorf("failed to get region from zones: %v", err) } volID = fmt.Sprintf(volIDRegionalFmt, UnspecifiedValue, region, pv.Spec.GCEPersistentDisk.PDName) } else { // Unspecified volID = fmt.Sprintf(volIDZonalFmt, UnspecifiedValue, UnspecifiedValue, pv.Spec.GCEPersistentDisk.PDName) } gceSource := pv.Spec.PersistentVolumeSource.GCEPersistentDisk partition := "" if gceSource.Partition != 0 { partition = strconv.Itoa(int(gceSource.Partition)) } csiSource := &v1.CSIPersistentVolumeSource{ Driver: GCEPDDriverName, VolumeHandle: volID, ReadOnly: gceSource.ReadOnly, FSType: gceSource.FSType, VolumeAttributes: map[string]string{ "partition": partition, }, } if err := translateTopologyFromInTreeToCSI(pv, GCEPDTopologyKey); err != nil { return nil, fmt.Errorf("failed to translate topology: %v", err) } pv.Spec.PersistentVolumeSource.GCEPersistentDisk = nil pv.Spec.PersistentVolumeSource.CSI = csiSource pv.Spec.AccessModes = backwardCompatibleAccessModes(pv.Spec.AccessModes) return pv, nil } // TranslateCSIPVToInTree takes a PV with CSIPersistentVolumeSource set and // translates the GCE PD CSI source to a GCEPersistentDisk source. func (g *gcePersistentDiskCSITranslator) TranslateCSIPVToInTree(pv *v1.PersistentVolume) (*v1.PersistentVolume, error) { if pv == nil || pv.Spec.CSI == nil { return nil, fmt.Errorf("pv is nil or CSI source not defined on pv") } csiSource := pv.Spec.CSI pdName, err := pdNameFromVolumeID(csiSource.VolumeHandle) if err != nil { return nil, err } gceSource := &v1.GCEPersistentDiskVolumeSource{ PDName: pdName, FSType: csiSource.FSType, ReadOnly: csiSource.ReadOnly, } if partition, ok := csiSource.VolumeAttributes["partition"]; ok && partition != "" { partInt, err := strconv.Atoi(partition) if err != nil { return nil, fmt.Errorf("Failed to convert partition %v to integer: %v", partition, err) } gceSource.Partition = int32(partInt) } // translate CSI topology to In-tree topology for rollback compatibility if err := translateTopologyFromCSIToInTree(pv, GCEPDTopologyKey, gceGetRegionFromZones); err != nil { return nil, fmt.Errorf("failed to translate topology. PV:%+v. Error:%v", *pv, err) } pv.Spec.CSI = nil pv.Spec.GCEPersistentDisk = gceSource return pv, nil } // CanSupport tests whether the plugin supports a given persistent volume // specification from the API. The spec pointer should be considered // const. func (g *gcePersistentDiskCSITranslator) CanSupport(pv *v1.PersistentVolume) bool { return pv != nil && pv.Spec.GCEPersistentDisk != nil } // CanSupportInline tests whether the plugin supports a given inline volume // specification from the API. The spec pointer should be considered // const. func (g *gcePersistentDiskCSITranslator) CanSupportInline(volume *v1.Volume) bool { return volume != nil && volume.GCEPersistentDisk != nil } // GetInTreePluginName returns the name of the intree plugin driver func (g *gcePersistentDiskCSITranslator) GetInTreePluginName() string { return GCEPDInTreePluginName } // GetCSIPluginName returns the name of the CSI plugin func (g *gcePersistentDiskCSITranslator) GetCSIPluginName() string { return GCEPDDriverName } // RepairVolumeHandle returns a fully specified volume handle by inferring // project, zone/region from the node ID if the volume handle has UNSPECIFIED // sections func (g *gcePersistentDiskCSITranslator) RepairVolumeHandle(volumeHandle, nodeID string) (string, error) { var err error tok := strings.Split(volumeHandle, "/") if len(tok) < volIDTotalElements { return "", fmt.Errorf("volume handle has wrong number of elements; got %v, wanted %v or more", len(tok), volIDTotalElements) } if tok[volIDProjectValue] != UnspecifiedValue { return volumeHandle, nil } nodeTok := strings.Split(nodeID, "/") if len(nodeTok) < volIDTotalElements { return "", fmt.Errorf("node handle has wrong number of elements; got %v, wanted %v or more", len(nodeTok), volIDTotalElements) } switch tok[volIDRegionalityValue] { case "zones": zone := "" if tok[volIDZoneValue] == UnspecifiedValue { zone = nodeTok[volIDZoneValue] } else { zone = tok[volIDZoneValue] } return fmt.Sprintf(volIDZonalFmt, nodeTok[volIDProjectValue], zone, tok[volIDDiskNameValue]), nil case "regions": region := "" if tok[volIDZoneValue] == UnspecifiedValue { region, err = gceGetRegionFromZones([]string{nodeTok[volIDZoneValue]}) if err != nil { return "", fmt.Errorf("failed to get region from zone %s: %v", nodeTok[volIDZoneValue], err) } } else { region = tok[volIDZoneValue] } return fmt.Sprintf(volIDRegionalFmt, nodeTok[volIDProjectValue], region, tok[volIDDiskNameValue]), nil default: return "", fmt.Errorf("expected volume handle to have zones or regions regionality value, got: %s", tok[volIDRegionalityValue]) } } func pdNameFromVolumeID(id string) (string, error) { splitID := strings.Split(id, "/") if len(splitID) < volIDTotalElements { return "", fmt.Errorf("failed to get id components.Got: %v, wanted %v components or more. ", len(splitID), volIDTotalElements) } return splitID[volIDDiskNameValue], nil } // TODO: Replace this with the imported one from GCE PD CSI Driver when // the driver removes all k8s/k8s dependencies func gceGetRegionFromZones(zones []string) (string, error) { regions := sets.String{} if len(zones) < 1 { return "", fmt.Errorf("no zones specified") } for _, zone := range zones { // Zone expected format {locale}-{region}-{zone} splitZone := strings.Split(zone, "-") if len(splitZone) != 3 { return "", fmt.Errorf("zone in unexpected format, expected: {locale}-{region}-{zone}, got: %v", zone) } regions.Insert(strings.Join(splitZone[0:2], "-")) } if regions.Len() != 1 { return "", fmt.Errorf("multiple or no regions gotten from zones, got: %v", regions) } return regions.UnsortedList()[0], nil }