mirror of https://github.com/minio/minio.git
				
				
				
			
		
			
				
	
	
		
			940 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			Go
		
	
	
	
			
		
		
	
	
			940 lines
		
	
	
		
			29 KiB
		
	
	
	
		
			Go
		
	
	
	
/*
 | 
						|
 * MinIO Cloud Storage, (C) 2016, 2017, 2018 MinIO, Inc.
 | 
						|
 *
 | 
						|
 * Licensed under the Apache License, Version 2.0 (the "License");
 | 
						|
 * you may not use this file except in compliance with the License.
 | 
						|
 * You may obtain a copy of the License at
 | 
						|
 *
 | 
						|
 *     http://www.apache.org/licenses/LICENSE-2.0
 | 
						|
 *
 | 
						|
 * Unless required by applicable law or agreed to in writing, software
 | 
						|
 * distributed under the License is distributed on an "AS IS" BASIS,
 | 
						|
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | 
						|
 * See the License for the specific language governing permissions and
 | 
						|
 * limitations under the License.
 | 
						|
 */
 | 
						|
 | 
						|
package cmd
 | 
						|
 | 
						|
import (
 | 
						|
	"context"
 | 
						|
	"encoding/hex"
 | 
						|
	"encoding/json"
 | 
						|
	"errors"
 | 
						|
	"fmt"
 | 
						|
	"io/ioutil"
 | 
						|
	"reflect"
 | 
						|
	"sync"
 | 
						|
 | 
						|
	humanize "github.com/dustin/go-humanize"
 | 
						|
	"github.com/minio/minio/cmd/config/storageclass"
 | 
						|
	"github.com/minio/minio/cmd/logger"
 | 
						|
	"github.com/minio/minio/pkg/color"
 | 
						|
	"github.com/minio/minio/pkg/sync/errgroup"
 | 
						|
	sha256 "github.com/minio/sha256-simd"
 | 
						|
)
 | 
						|
 | 
						|
const (
	// formatBackendErasure is the backend name used for the Erasure backend.
	formatBackendErasure = "xl"

	// Values of the Erasure.Version field for formatErasureV1,
	// formatErasureV2 and formatErasureV3 respectively.
	formatErasureVersionV1 = "1"
	formatErasureVersionV2 = "2"
	formatErasureVersionV3 = "3"

	// formatErasureVersionV2DistributionAlgoLegacy names the legacy
	// distribution algorithm.
	formatErasureVersionV2DistributionAlgoLegacy = "CRCMOD"

	// formatErasureVersionV3DistributionAlgo names the distribution
	// algorithm currently in use.
	formatErasureVersionV3DistributionAlgo = "SIPMOD"
)
 | 
						|
 | 
						|
// offlineDiskUUID is the placeholder UUID that represents an offline disk.
const offlineDiskUUID = "ffffffff-ffff-ffff-ffff-ffffffffffff"
 | 
						|
 | 
						|
// formatErasureVersionDetect is a minimal view of `format.json` that
// decodes only the version stored under its "xl" section. It is used
// to detect the version of the "xl" format.
type formatErasureVersionDetect struct {
	Erasure struct {
		// Version of the 'xl' format.
		Version string `json:"version"`
	} `json:"xl"`
}
 | 
						|
 | 
						|
// Represents the V1 backend disk structure version
 | 
						|
// under `.minio.sys` and actual data namespace.
 | 
						|
// formatErasureV1 - structure holds format config version '1'.
 | 
						|
type formatErasureV1 struct {
 | 
						|
	formatMetaV1
 | 
						|
	Erasure struct {
 | 
						|
		Version string `json:"version"` // Version of 'xl' format.
 | 
						|
		Disk    string `json:"disk"`    // Disk field carries assigned disk uuid.
 | 
						|
		// JBOD field carries the input disk order generated the first
 | 
						|
		// time when fresh disks were supplied.
 | 
						|
		JBOD []string `json:"jbod"`
 | 
						|
	} `json:"xl"` // Erasure field holds xl format.
 | 
						|
}
 | 
						|
 | 
						|
// Represents the V2 backend disk structure version
 | 
						|
// under `.minio.sys` and actual data namespace.
 | 
						|
// formatErasureV2 - structure holds format config version '2'.
 | 
						|
// The V2 format to support "large bucket" support where a bucket
 | 
						|
// can span multiple erasure sets.
 | 
						|
type formatErasureV2 struct {
 | 
						|
	formatMetaV1
 | 
						|
	Erasure struct {
 | 
						|
		Version string `json:"version"` // Version of 'xl' format.
 | 
						|
		This    string `json:"this"`    // This field carries assigned disk uuid.
 | 
						|
		// Sets field carries the input disk order generated the first
 | 
						|
		// time when fresh disks were supplied, it is a two dimensional
 | 
						|
		// array second dimension represents list of disks used per set.
 | 
						|
		Sets [][]string `json:"sets"`
 | 
						|
		// Distribution algorithm represents the hashing algorithm
 | 
						|
		// to pick the right set index for an object.
 | 
						|
		DistributionAlgo string `json:"distributionAlgo"`
 | 
						|
	} `json:"xl"`
 | 
						|
}
 | 
						|
 | 
						|
// formatErasureV3 struct is same as formatErasureV2 struct except that formatErasureV3.Erasure.Version is "3" indicating
 | 
						|
// the simplified multipart backend which is a flat hierarchy now.
 | 
						|
// In .minio.sys/multipart we have:
 | 
						|
// sha256(bucket/object)/uploadID/[xl.meta, part.1, part.2 ....]
 | 
						|
type formatErasureV3 struct {
 | 
						|
	formatMetaV1
 | 
						|
	Erasure struct {
 | 
						|
		Version string `json:"version"` // Version of 'xl' format.
 | 
						|
		This    string `json:"this"`    // This field carries assigned disk uuid.
 | 
						|
		// Sets field carries the input disk order generated the first
 | 
						|
		// time when fresh disks were supplied, it is a two dimensional
 | 
						|
		// array second dimension represents list of disks used per set.
 | 
						|
		Sets [][]string `json:"sets"`
 | 
						|
		// Distribution algorithm represents the hashing algorithm
 | 
						|
		// to pick the right set index for an object.
 | 
						|
		DistributionAlgo string `json:"distributionAlgo"`
 | 
						|
	} `json:"xl"`
 | 
						|
}
 | 
						|
 | 
						|
func (f *formatErasureV3) Clone() *formatErasureV3 {
 | 
						|
	b, err := json.Marshal(f)
 | 
						|
	if err != nil {
 | 
						|
		panic(err)
 | 
						|
	}
 | 
						|
	var dst formatErasureV3
 | 
						|
	if err = json.Unmarshal(b, &dst); err != nil {
 | 
						|
		panic(err)
 | 
						|
	}
 | 
						|
	return &dst
 | 
						|
}
 | 
						|
 | 
						|
// Returns formatErasure.Erasure.Version
 | 
						|
func newFormatErasureV3(numSets int, setLen int, distributionAlgo string) *formatErasureV3 {
 | 
						|
	format := &formatErasureV3{}
 | 
						|
	format.Version = formatMetaVersionV1
 | 
						|
	format.Format = formatBackendErasure
 | 
						|
	format.ID = mustGetUUID()
 | 
						|
	format.Erasure.Version = formatErasureVersionV3
 | 
						|
	if distributionAlgo == "" {
 | 
						|
		format.Erasure.DistributionAlgo = formatErasureVersionV3DistributionAlgo
 | 
						|
	} else {
 | 
						|
		format.Erasure.DistributionAlgo = distributionAlgo
 | 
						|
	}
 | 
						|
	format.Erasure.Sets = make([][]string, numSets)
 | 
						|
 | 
						|
	for i := 0; i < numSets; i++ {
 | 
						|
		format.Erasure.Sets[i] = make([]string, setLen)
 | 
						|
		for j := 0; j < setLen; j++ {
 | 
						|
			format.Erasure.Sets[i][j] = mustGetUUID()
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return format
 | 
						|
}
 | 
						|
 | 
						|
// Returns format Erasure version after reading `format.json`, returns
 | 
						|
// successfully the version only if the backend is Erasure.
 | 
						|
func formatGetBackendErasureVersion(formatPath string) (string, error) {
 | 
						|
	meta := &formatMetaV1{}
 | 
						|
	b, err := ioutil.ReadFile(formatPath)
 | 
						|
	if err != nil {
 | 
						|
		return "", err
 | 
						|
	}
 | 
						|
	if err = json.Unmarshal(b, meta); err != nil {
 | 
						|
		return "", err
 | 
						|
	}
 | 
						|
	if meta.Version != formatMetaVersionV1 {
 | 
						|
		return "", fmt.Errorf(`format.Version expected: %s, got: %s`, formatMetaVersionV1, meta.Version)
 | 
						|
	}
 | 
						|
	if meta.Format != formatBackendErasure {
 | 
						|
		return "", fmt.Errorf(`found backend type %s, expected %s`, meta.Format, formatBackendErasure)
 | 
						|
	}
 | 
						|
	// Erasure backend found, proceed to detect version.
 | 
						|
	format := &formatErasureVersionDetect{}
 | 
						|
	if err = json.Unmarshal(b, format); err != nil {
 | 
						|
		return "", err
 | 
						|
	}
 | 
						|
	return format.Erasure.Version, nil
 | 
						|
}
 | 
						|
 | 
						|
// Migrates all previous versions to latest version of `format.json`,
 | 
						|
// this code calls migration in sequence, such as V1 is migrated to V2
 | 
						|
// first before it V2 migrates to V3.n
 | 
						|
func formatErasureMigrate(export string) error {
 | 
						|
	formatPath := pathJoin(export, minioMetaBucket, formatConfigFile)
 | 
						|
	version, err := formatGetBackendErasureVersion(formatPath)
 | 
						|
	if err != nil {
 | 
						|
		return fmt.Errorf("Disk %s: %w", export, err)
 | 
						|
	}
 | 
						|
	switch version {
 | 
						|
	case formatErasureVersionV1:
 | 
						|
		if err = formatErasureMigrateV1ToV2(export, version); err != nil {
 | 
						|
			return fmt.Errorf("Disk %s: %w", export, err)
 | 
						|
		}
 | 
						|
		// Migrate successful v1 => v2, proceed to v2 => v3
 | 
						|
		version = formatErasureVersionV2
 | 
						|
		fallthrough
 | 
						|
	case formatErasureVersionV2:
 | 
						|
		if err = formatErasureMigrateV2ToV3(export, version); err != nil {
 | 
						|
			return fmt.Errorf("Disk %s: %w", export, err)
 | 
						|
		}
 | 
						|
		// Migrate successful v2 => v3, v3 is latest
 | 
						|
		// version = formatXLVersionV3
 | 
						|
		fallthrough
 | 
						|
	case formatErasureVersionV3:
 | 
						|
		// v3 is the latest version, return.
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
	return fmt.Errorf(`Disk %s: unknown format version %s`, export, version)
 | 
						|
}
 | 
						|
 | 
						|
// Migrates version V1 of format.json to version V2 of format.json,
 | 
						|
// migration fails upon any error.
 | 
						|
func formatErasureMigrateV1ToV2(export, version string) error {
 | 
						|
	if version != formatErasureVersionV1 {
 | 
						|
		return fmt.Errorf(`format version expected %s, found %s`, formatErasureVersionV1, version)
 | 
						|
	}
 | 
						|
 | 
						|
	formatPath := pathJoin(export, minioMetaBucket, formatConfigFile)
 | 
						|
 | 
						|
	formatV1 := &formatErasureV1{}
 | 
						|
	b, err := ioutil.ReadFile(formatPath)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
	if err = json.Unmarshal(b, formatV1); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	formatV2 := &formatErasureV2{}
 | 
						|
	formatV2.Version = formatMetaVersionV1
 | 
						|
	formatV2.Format = formatBackendErasure
 | 
						|
	formatV2.Erasure.Version = formatErasureVersionV2
 | 
						|
	formatV2.Erasure.DistributionAlgo = formatErasureVersionV2DistributionAlgoLegacy
 | 
						|
	formatV2.Erasure.This = formatV1.Erasure.Disk
 | 
						|
	formatV2.Erasure.Sets = make([][]string, 1)
 | 
						|
	formatV2.Erasure.Sets[0] = make([]string, len(formatV1.Erasure.JBOD))
 | 
						|
	copy(formatV2.Erasure.Sets[0], formatV1.Erasure.JBOD)
 | 
						|
 | 
						|
	b, err = json.Marshal(formatV2)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
	return ioutil.WriteFile(formatPath, b, 0644)
 | 
						|
}
 | 
						|
 | 
						|
// Migrates V2 for format.json to V3 (Flat hierarchy for multipart)
 | 
						|
func formatErasureMigrateV2ToV3(export, version string) error {
 | 
						|
	if version != formatErasureVersionV2 {
 | 
						|
		return fmt.Errorf(`format version expected %s, found %s`, formatErasureVersionV2, version)
 | 
						|
	}
 | 
						|
 | 
						|
	formatPath := pathJoin(export, minioMetaBucket, formatConfigFile)
 | 
						|
	formatV2 := &formatErasureV2{}
 | 
						|
	b, err := ioutil.ReadFile(formatPath)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
	err = json.Unmarshal(b, formatV2)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	if err = removeAll(pathJoin(export, minioMetaMultipartBucket)); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	if err = mkdirAll(pathJoin(export, minioMetaMultipartBucket), 0755); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	// format-V2 struct is exactly same as format-V1 except that version is "3"
 | 
						|
	// which indicates the simplified multipart backend.
 | 
						|
	formatV3 := formatErasureV3{}
 | 
						|
 | 
						|
	formatV3.Version = formatV2.Version
 | 
						|
	formatV3.Format = formatV2.Format
 | 
						|
	formatV3.Erasure = formatV2.Erasure
 | 
						|
 | 
						|
	formatV3.Erasure.Version = formatErasureVersionV3
 | 
						|
 | 
						|
	b, err = json.Marshal(formatV3)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
	return ioutil.WriteFile(formatPath, b, 0644)
 | 
						|
}
 | 
						|
 | 
						|
// countErrs returns how many entries of errs are equal (==) to err.
func countErrs(errs []error, err error) int {
	matches := 0
	for i := range errs {
		if errs[i] != err {
			continue
		}
		matches++
	}
	return matches
}
 | 
						|
 | 
						|
// Does all errors indicate we need to initialize all disks?.
 | 
						|
func shouldInitErasureDisks(errs []error) bool {
 | 
						|
	return countErrs(errs, errUnformattedDisk) == len(errs)
 | 
						|
}
 | 
						|
 | 
						|
// Check if unformatted disks are equal to write quorum.
 | 
						|
func quorumUnformattedDisks(errs []error) bool {
 | 
						|
	return countErrs(errs, errUnformattedDisk) >= (len(errs)/2)+1
 | 
						|
}
 | 
						|
 | 
						|
// loadFormatErasureAll - load all format config from all input disks in parallel.
 | 
						|
func loadFormatErasureAll(storageDisks []StorageAPI, heal bool) ([]*formatErasureV3, []error) {
 | 
						|
	// Initialize list of errors.
 | 
						|
	g := errgroup.WithNErrs(len(storageDisks))
 | 
						|
 | 
						|
	// Initialize format configs.
 | 
						|
	var formats = make([]*formatErasureV3, len(storageDisks))
 | 
						|
 | 
						|
	// Load format from each disk in parallel
 | 
						|
	for index := range storageDisks {
 | 
						|
		index := index
 | 
						|
		g.Go(func() error {
 | 
						|
			if storageDisks[index] == nil {
 | 
						|
				return errDiskNotFound
 | 
						|
			}
 | 
						|
			format, err := loadFormatErasure(storageDisks[index])
 | 
						|
			if err != nil {
 | 
						|
				return err
 | 
						|
			}
 | 
						|
			formats[index] = format
 | 
						|
			if !heal {
 | 
						|
				// If no healing required, make the disks valid and
 | 
						|
				// online.
 | 
						|
				storageDisks[index].SetDiskID(format.Erasure.This)
 | 
						|
			}
 | 
						|
			return nil
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
 | 
						|
	// Return all formats and errors if any.
 | 
						|
	return formats, g.Wait()
 | 
						|
}
 | 
						|
 | 
						|
func saveHealingTracker(disk StorageAPI, diskID string) error {
 | 
						|
	htracker := healingTracker{
 | 
						|
		ID: diskID,
 | 
						|
	}
 | 
						|
	htrackerBytes, err := htracker.MarshalMsg(nil)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
	return disk.WriteAll(context.TODO(), minioMetaBucket,
 | 
						|
		pathJoin(bucketMetaPrefix, slashSeparator, healingTrackerFilename),
 | 
						|
		htrackerBytes)
 | 
						|
}
 | 
						|
 | 
						|
func saveFormatErasure(disk StorageAPI, format *formatErasureV3, heal bool) error {
 | 
						|
	if disk == nil || format == nil {
 | 
						|
		return errDiskNotFound
 | 
						|
	}
 | 
						|
 | 
						|
	diskID := format.Erasure.This
 | 
						|
 | 
						|
	if err := makeFormatErasureMetaVolumes(disk); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	// Marshal and write to disk.
 | 
						|
	formatBytes, err := json.Marshal(format)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	tmpFormat := mustGetUUID()
 | 
						|
 | 
						|
	// Purge any existing temporary file, okay to ignore errors here.
 | 
						|
	defer disk.Delete(context.TODO(), minioMetaBucket, tmpFormat, false)
 | 
						|
 | 
						|
	// write to unique file.
 | 
						|
	if err = disk.WriteAll(context.TODO(), minioMetaBucket, tmpFormat, formatBytes); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	// Rename file `uuid.json` --> `format.json`.
 | 
						|
	if err = disk.RenameFile(context.TODO(), minioMetaBucket, tmpFormat, minioMetaBucket, formatConfigFile); err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	disk.SetDiskID(diskID)
 | 
						|
	if heal {
 | 
						|
		return saveHealingTracker(disk, diskID)
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
var ignoredHiddenDirectories = map[string]struct{}{
 | 
						|
	minioMetaBucket:             {}, // metabucket '.minio.sys'
 | 
						|
	".minio":                    {}, // users may choose to double down the backend as the config folder for certs
 | 
						|
	".snapshot":                 {}, // .snapshot for ignoring NetApp based persistent volumes WAFL snapshot
 | 
						|
	"lost+found":                {}, // 'lost+found' directory default on ext4 filesystems
 | 
						|
	"$RECYCLE.BIN":              {}, // windows specific directory for each drive (hidden)
 | 
						|
	"System Volume Information": {}, // windows specific directory for each drive (hidden)
 | 
						|
}
 | 
						|
 | 
						|
func isHiddenDirectories(vols ...VolInfo) bool {
 | 
						|
	for _, vol := range vols {
 | 
						|
		if _, ok := ignoredHiddenDirectories[vol.Name]; ok {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		return false
 | 
						|
	}
 | 
						|
	return true
 | 
						|
}
 | 
						|
 | 
						|
// loadFormatErasure - loads format.json from disk.
 | 
						|
func loadFormatErasure(disk StorageAPI) (format *formatErasureV3, err error) {
 | 
						|
	buf, err := disk.ReadAll(context.TODO(), minioMetaBucket, formatConfigFile)
 | 
						|
	if err != nil {
 | 
						|
		// 'file not found' and 'volume not found' as
 | 
						|
		// same. 'volume not found' usually means its a fresh disk.
 | 
						|
		if err == errFileNotFound || err == errVolumeNotFound {
 | 
						|
			var vols []VolInfo
 | 
						|
			vols, err = disk.ListVols(context.TODO())
 | 
						|
			if err != nil {
 | 
						|
				return nil, err
 | 
						|
			}
 | 
						|
			if !isHiddenDirectories(vols...) {
 | 
						|
				// 'format.json' not found, but we found user data, reject such disks.
 | 
						|
				return nil, fmt.Errorf("some unexpected files '%v' found on %s: %w",
 | 
						|
					vols, disk, errCorruptedFormat)
 | 
						|
			}
 | 
						|
			// No other data found, its a fresh disk.
 | 
						|
			return nil, errUnformattedDisk
 | 
						|
		}
 | 
						|
		return nil, err
 | 
						|
	}
 | 
						|
 | 
						|
	// Try to decode format json into formatConfigV1 struct.
 | 
						|
	format = &formatErasureV3{}
 | 
						|
	if err = json.Unmarshal(buf, format); err != nil {
 | 
						|
		return nil, err
 | 
						|
	}
 | 
						|
 | 
						|
	// Success.
 | 
						|
	return format, nil
 | 
						|
}
 | 
						|
 | 
						|
// Valid formatErasure basic versions.
 | 
						|
func checkFormatErasureValue(formatErasure *formatErasureV3) error {
 | 
						|
	// Validate format version and format type.
 | 
						|
	if formatErasure.Version != formatMetaVersionV1 {
 | 
						|
		return fmt.Errorf("Unsupported version of backend format [%s] found", formatErasure.Version)
 | 
						|
	}
 | 
						|
	if formatErasure.Format != formatBackendErasure {
 | 
						|
		return fmt.Errorf("Unsupported backend format [%s] found", formatErasure.Format)
 | 
						|
	}
 | 
						|
	if formatErasure.Erasure.Version != formatErasureVersionV3 {
 | 
						|
		return fmt.Errorf("Unsupported Erasure backend format found [%s]", formatErasure.Erasure.Version)
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// Check all format values.
 | 
						|
func checkFormatErasureValues(formats []*formatErasureV3, setDriveCount int) error {
 | 
						|
	for i, formatErasure := range formats {
 | 
						|
		if formatErasure == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		if err := checkFormatErasureValue(formatErasure); err != nil {
 | 
						|
			return err
 | 
						|
		}
 | 
						|
		if len(formats) != len(formatErasure.Erasure.Sets)*len(formatErasure.Erasure.Sets[0]) {
 | 
						|
			return fmt.Errorf("%s disk is already being used in another erasure deployment. (Number of disks specified: %d but the number of disks found in the %s disk's format.json: %d)",
 | 
						|
				humanize.Ordinal(i+1), len(formats), humanize.Ordinal(i+1), len(formatErasure.Erasure.Sets)*len(formatErasure.Erasure.Sets[0]))
 | 
						|
		}
 | 
						|
		// Only if custom erasure drive count is set,
 | 
						|
		// we should fail here other proceed to honor what
 | 
						|
		// is present on the disk.
 | 
						|
		if globalCustomErasureDriveCount && len(formatErasure.Erasure.Sets[0]) != setDriveCount {
 | 
						|
			return fmt.Errorf("%s disk is already formatted with %d drives per erasure set. This cannot be changed to %d, please revert your MINIO_ERASURE_SET_DRIVE_COUNT setting", humanize.Ordinal(i+1), len(formatErasure.Erasure.Sets[0]), setDriveCount)
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// Get Deployment ID for the Erasure sets from format.json.
 | 
						|
// This need not be in quorum. Even if one of the format.json
 | 
						|
// file has this value, we assume it is valid.
 | 
						|
// If more than one format.json's have different id, it is considered a corrupt
 | 
						|
// backend format.
 | 
						|
func formatErasureGetDeploymentID(refFormat *formatErasureV3, formats []*formatErasureV3) (string, error) {
 | 
						|
	var deploymentID string
 | 
						|
	for _, format := range formats {
 | 
						|
		if format == nil || format.ID == "" {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		if reflect.DeepEqual(format.Erasure.Sets, refFormat.Erasure.Sets) {
 | 
						|
			// Found an ID in one of the format.json file
 | 
						|
			// Set deploymentID for the first time.
 | 
						|
			if deploymentID == "" {
 | 
						|
				deploymentID = format.ID
 | 
						|
			} else if deploymentID != format.ID {
 | 
						|
				// DeploymentID found earlier doesn't match with the
 | 
						|
				// current format.json's ID.
 | 
						|
				return "", fmt.Errorf("Deployment IDs do not match expected %s, got %s: %w",
 | 
						|
					deploymentID, format.ID, errCorruptedFormat)
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return deploymentID, nil
 | 
						|
}
 | 
						|
 | 
						|
// formatErasureFixDeploymentID - Add deployment id if it is not present.
 | 
						|
func formatErasureFixDeploymentID(endpoints Endpoints, storageDisks []StorageAPI, refFormat *formatErasureV3) (err error) {
 | 
						|
	// Attempt to load all `format.json` from all disks.
 | 
						|
	formats, _ := loadFormatErasureAll(storageDisks, false)
 | 
						|
	for index := range formats {
 | 
						|
		// If the Erasure sets do not match, set those formats to nil,
 | 
						|
		// We do not have to update the ID on those format.json file.
 | 
						|
		if formats[index] != nil && !reflect.DeepEqual(formats[index].Erasure.Sets, refFormat.Erasure.Sets) {
 | 
						|
			formats[index] = nil
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	refFormat.ID, err = formatErasureGetDeploymentID(refFormat, formats)
 | 
						|
	if err != nil {
 | 
						|
		return err
 | 
						|
	}
 | 
						|
 | 
						|
	// If ID is set, then some other node got the lock
 | 
						|
	// before this node could and generated an ID
 | 
						|
	// for the deployment. No need to generate one.
 | 
						|
	if refFormat.ID != "" {
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
 | 
						|
	// ID is generated for the first time,
 | 
						|
	// We set the ID in all the formats and update.
 | 
						|
	refFormat.ID = mustGetUUID()
 | 
						|
	for _, format := range formats {
 | 
						|
		if format != nil {
 | 
						|
			format.ID = refFormat.ID
 | 
						|
		}
 | 
						|
	}
 | 
						|
	// Deployment ID needs to be set on all the disks.
 | 
						|
	// Save `format.json` across all disks.
 | 
						|
	return saveFormatErasureAll(GlobalContext, storageDisks, formats)
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
// Update only the valid local disks which have not been updated before.
 | 
						|
func formatErasureFixLocalDeploymentID(endpoints Endpoints, storageDisks []StorageAPI, refFormat *formatErasureV3) error {
 | 
						|
	// If this server was down when the deploymentID was updated
 | 
						|
	// then we make sure that we update the local disks with the deploymentID.
 | 
						|
 | 
						|
	// Initialize errs to collect errors inside go-routine.
 | 
						|
	g := errgroup.WithNErrs(len(storageDisks))
 | 
						|
 | 
						|
	for index := range storageDisks {
 | 
						|
		index := index
 | 
						|
		g.Go(func() error {
 | 
						|
			if endpoints[index].IsLocal && storageDisks[index] != nil && storageDisks[index].IsOnline() {
 | 
						|
				format, err := loadFormatErasure(storageDisks[index])
 | 
						|
				if err != nil {
 | 
						|
					// Disk can be offline etc.
 | 
						|
					// ignore the errors seen here.
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				if format.ID != "" {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				if !reflect.DeepEqual(format.Erasure.Sets, refFormat.Erasure.Sets) {
 | 
						|
					return nil
 | 
						|
				}
 | 
						|
				format.ID = refFormat.ID
 | 
						|
				// Heal the drive if we fixed its deployment ID.
 | 
						|
				if err := saveFormatErasure(storageDisks[index], format, true); err != nil {
 | 
						|
					logger.LogIf(GlobalContext, err)
 | 
						|
					return fmt.Errorf("Unable to save format.json, %w", err)
 | 
						|
				}
 | 
						|
			}
 | 
						|
			return nil
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
	for _, err := range g.Wait() {
 | 
						|
		if err != nil {
 | 
						|
			return err
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// Get backend Erasure format in quorum `format.json`.
 | 
						|
func getFormatErasureInQuorum(formats []*formatErasureV3) (*formatErasureV3, error) {
 | 
						|
	formatHashes := make([]string, len(formats))
 | 
						|
	for i, format := range formats {
 | 
						|
		if format == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		h := sha256.New()
 | 
						|
		for _, set := range format.Erasure.Sets {
 | 
						|
			for _, diskID := range set {
 | 
						|
				h.Write([]byte(diskID))
 | 
						|
			}
 | 
						|
		}
 | 
						|
		formatHashes[i] = hex.EncodeToString(h.Sum(nil))
 | 
						|
	}
 | 
						|
 | 
						|
	formatCountMap := make(map[string]int)
 | 
						|
	for _, hash := range formatHashes {
 | 
						|
		if hash == "" {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		formatCountMap[hash]++
 | 
						|
	}
 | 
						|
 | 
						|
	maxHash := ""
 | 
						|
	maxCount := 0
 | 
						|
	for hash, count := range formatCountMap {
 | 
						|
		if count > maxCount {
 | 
						|
			maxCount = count
 | 
						|
			maxHash = hash
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	if maxCount < len(formats)/2 {
 | 
						|
		return nil, errErasureReadQuorum
 | 
						|
	}
 | 
						|
 | 
						|
	for i, hash := range formatHashes {
 | 
						|
		if hash == maxHash {
 | 
						|
			format := formats[i].Clone()
 | 
						|
			format.Erasure.This = ""
 | 
						|
			return format, nil
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	return nil, errErasureReadQuorum
 | 
						|
}
 | 
						|
 | 
						|
func formatErasureV3Check(reference *formatErasureV3, format *formatErasureV3) error {
 | 
						|
	tmpFormat := format.Clone()
 | 
						|
	this := tmpFormat.Erasure.This
 | 
						|
	tmpFormat.Erasure.This = ""
 | 
						|
	if len(reference.Erasure.Sets) != len(format.Erasure.Sets) {
 | 
						|
		return fmt.Errorf("Expected number of sets %d, got %d", len(reference.Erasure.Sets), len(format.Erasure.Sets))
 | 
						|
	}
 | 
						|
 | 
						|
	// Make sure that the sets match.
 | 
						|
	for i := range reference.Erasure.Sets {
 | 
						|
		if len(reference.Erasure.Sets[i]) != len(format.Erasure.Sets[i]) {
 | 
						|
			return fmt.Errorf("Each set should be of same size, expected %d got %d",
 | 
						|
				len(reference.Erasure.Sets[i]), len(format.Erasure.Sets[i]))
 | 
						|
		}
 | 
						|
		for j := range reference.Erasure.Sets[i] {
 | 
						|
			if reference.Erasure.Sets[i][j] != format.Erasure.Sets[i][j] {
 | 
						|
				return fmt.Errorf("UUID on positions %d:%d do not match with, expected %s got %s: (%w)",
 | 
						|
					i, j, reference.Erasure.Sets[i][j], format.Erasure.Sets[i][j], errInconsistentDisk)
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	// Make sure that the diskID is found in the set.
 | 
						|
	for i := 0; i < len(tmpFormat.Erasure.Sets); i++ {
 | 
						|
		for j := 0; j < len(tmpFormat.Erasure.Sets[i]); j++ {
 | 
						|
			if this == tmpFormat.Erasure.Sets[i][j] {
 | 
						|
				return nil
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return fmt.Errorf("Disk ID %s not found in any disk sets %s", this, format.Erasure.Sets)
 | 
						|
}
 | 
						|
 | 
						|
// Initializes meta volume only on local storage disks.
 | 
						|
func initErasureMetaVolumesInLocalDisks(storageDisks []StorageAPI, formats []*formatErasureV3) error {
 | 
						|
 | 
						|
	// Compute the local disks eligible for meta volumes (re)initialization
 | 
						|
	var disksToInit []StorageAPI
 | 
						|
	for index := range storageDisks {
 | 
						|
		if formats[index] == nil || storageDisks[index] == nil || !storageDisks[index].IsLocal() {
 | 
						|
			// Ignore create meta volume on disks which are not found or not local.
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		disksToInit = append(disksToInit, storageDisks[index])
 | 
						|
	}
 | 
						|
 | 
						|
	// Initialize errs to collect errors inside go-routine.
 | 
						|
	g := errgroup.WithNErrs(len(disksToInit))
 | 
						|
 | 
						|
	// Initialize all disks in parallel.
 | 
						|
	for index := range disksToInit {
 | 
						|
		// Initialize a new index variable in each loop so each
 | 
						|
		// goroutine will return its own instance of index variable.
 | 
						|
		index := index
 | 
						|
		g.Go(func() error {
 | 
						|
			return makeFormatErasureMetaVolumes(disksToInit[index])
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
 | 
						|
	// Return upon first error.
 | 
						|
	for _, err := range g.Wait() {
 | 
						|
		if err == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		return toObjectErr(err, minioMetaBucket)
 | 
						|
	}
 | 
						|
 | 
						|
	// Return success here.
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// saveUnformattedFormat - populates `format.json` on unformatted disks.
 | 
						|
// also adds `.healing.bin` on the disks which are being actively healed.
 | 
						|
func saveUnformattedFormat(ctx context.Context, storageDisks []StorageAPI, formats []*formatErasureV3) error {
 | 
						|
	for index, format := range formats {
 | 
						|
		if format == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		if err := saveFormatErasure(storageDisks[index], format, true); err != nil {
 | 
						|
			return err
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
}
 | 
						|
 | 
						|
// saveFormatErasureAll - populates `format.json` on disks in its order.
 | 
						|
func saveFormatErasureAll(ctx context.Context, storageDisks []StorageAPI, formats []*formatErasureV3) error {
 | 
						|
	g := errgroup.WithNErrs(len(storageDisks))
 | 
						|
 | 
						|
	// Write `format.json` to all disks.
 | 
						|
	for index := range storageDisks {
 | 
						|
		index := index
 | 
						|
		g.Go(func() error {
 | 
						|
			if formats[index] == nil {
 | 
						|
				return errDiskNotFound
 | 
						|
			}
 | 
						|
			return saveFormatErasure(storageDisks[index], formats[index], false)
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
 | 
						|
	writeQuorum := getWriteQuorum(len(storageDisks))
 | 
						|
	// Wait for the routines to finish.
 | 
						|
	return reduceWriteQuorumErrs(ctx, g.Wait(), nil, writeQuorum)
 | 
						|
}
 | 
						|
 | 
						|
// relinquishes the underlying connection for all storage disks.
 | 
						|
func closeStorageDisks(storageDisks []StorageAPI) {
 | 
						|
	for _, disk := range storageDisks {
 | 
						|
		if disk == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		disk.Close()
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
func initStorageDisksWithErrorsWithoutHealthCheck(endpoints Endpoints) ([]StorageAPI, []error) {
 | 
						|
	// Bootstrap disks.
 | 
						|
	storageDisks := make([]StorageAPI, len(endpoints))
 | 
						|
	g := errgroup.WithNErrs(len(endpoints))
 | 
						|
	for index := range endpoints {
 | 
						|
		index := index
 | 
						|
		g.Go(func() (err error) {
 | 
						|
			storageDisks[index], err = newStorageAPIWithoutHealthCheck(endpoints[index])
 | 
						|
			return err
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
	return storageDisks, g.Wait()
 | 
						|
}
 | 
						|
 | 
						|
// Initialize storage disks for each endpoint.
 | 
						|
// Errors are returned for each endpoint with matching index.
 | 
						|
func initStorageDisksWithErrors(endpoints Endpoints) ([]StorageAPI, []error) {
 | 
						|
	// Bootstrap disks.
 | 
						|
	storageDisks := make([]StorageAPI, len(endpoints))
 | 
						|
	g := errgroup.WithNErrs(len(endpoints))
 | 
						|
	for index := range endpoints {
 | 
						|
		index := index
 | 
						|
		g.Go(func() (err error) {
 | 
						|
			storageDisks[index], err = newStorageAPI(endpoints[index])
 | 
						|
			return err
 | 
						|
		}, index)
 | 
						|
	}
 | 
						|
	return storageDisks, g.Wait()
 | 
						|
}
 | 
						|
 | 
						|
// formatErasureV3ThisEmpty - find out if '.This' field is empty
 | 
						|
// in any of the input `formats`, if yes return true.
 | 
						|
func formatErasureV3ThisEmpty(formats []*formatErasureV3) bool {
 | 
						|
	for _, format := range formats {
 | 
						|
		if format == nil {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		// NOTE: This code is specifically needed when migrating version
 | 
						|
		// V1 to V2 to V3, in a scenario such as this we only need to handle
 | 
						|
		// single sets since we never used to support multiple sets in releases
 | 
						|
		// with V1 format version.
 | 
						|
		if len(format.Erasure.Sets) > 1 {
 | 
						|
			continue
 | 
						|
		}
 | 
						|
		if format.Erasure.This == "" {
 | 
						|
			return true
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return false
 | 
						|
}
 | 
						|
 | 
						|
// fixFormatErasureV3 - fix format Erasure configuration on all disks.
 | 
						|
func fixFormatErasureV3(storageDisks []StorageAPI, endpoints Endpoints, formats []*formatErasureV3) error {
 | 
						|
	g := errgroup.WithNErrs(len(formats))
 | 
						|
	for i := range formats {
 | 
						|
		i := i
 | 
						|
		g.Go(func() error {
 | 
						|
			if formats[i] == nil || !endpoints[i].IsLocal {
 | 
						|
				return nil
 | 
						|
			}
 | 
						|
			// NOTE: This code is specifically needed when migrating version
 | 
						|
			// V1 to V2 to V3, in a scenario such as this we only need to handle
 | 
						|
			// single sets since we never used to support multiple sets in releases
 | 
						|
			// with V1 format version.
 | 
						|
			if len(formats[i].Erasure.Sets) > 1 {
 | 
						|
				return nil
 | 
						|
			}
 | 
						|
			if formats[i].Erasure.This == "" {
 | 
						|
				formats[i].Erasure.This = formats[i].Erasure.Sets[0][i]
 | 
						|
				// Heal the drive if drive has .This empty.
 | 
						|
				if err := saveFormatErasure(storageDisks[i], formats[i], true); err != nil {
 | 
						|
					return err
 | 
						|
				}
 | 
						|
			}
 | 
						|
			return nil
 | 
						|
		}, i)
 | 
						|
	}
 | 
						|
	for _, err := range g.Wait() {
 | 
						|
		if err != nil {
 | 
						|
			return err
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return nil
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
// initFormatErasure - save Erasure format configuration on all disks.
 | 
						|
func initFormatErasure(ctx context.Context, storageDisks []StorageAPI, setCount, setDriveCount int, distributionAlgo string, deploymentID string, sErrs []error) (*formatErasureV3, error) {
 | 
						|
	format := newFormatErasureV3(setCount, setDriveCount, distributionAlgo)
 | 
						|
	formats := make([]*formatErasureV3, len(storageDisks))
 | 
						|
	wantAtMost := ecDrivesNoConfig(setDriveCount)
 | 
						|
 | 
						|
	for i := 0; i < setCount; i++ {
 | 
						|
		hostCount := make(map[string]int, setDriveCount)
 | 
						|
		for j := 0; j < setDriveCount; j++ {
 | 
						|
			disk := storageDisks[i*setDriveCount+j]
 | 
						|
			newFormat := format.Clone()
 | 
						|
			newFormat.Erasure.This = format.Erasure.Sets[i][j]
 | 
						|
			if deploymentID != "" {
 | 
						|
				newFormat.ID = deploymentID
 | 
						|
			}
 | 
						|
			hostCount[disk.Hostname()]++
 | 
						|
			formats[i*setDriveCount+j] = newFormat
 | 
						|
		}
 | 
						|
		if len(hostCount) > 0 {
 | 
						|
			var once sync.Once
 | 
						|
			for host, count := range hostCount {
 | 
						|
				if count > wantAtMost {
 | 
						|
					if host == "" {
 | 
						|
						host = "local"
 | 
						|
					}
 | 
						|
					once.Do(func() {
 | 
						|
						if len(hostCount) == 1 {
 | 
						|
							return
 | 
						|
						}
 | 
						|
						logger.Info(" * Set %v:", i+1)
 | 
						|
						for j := 0; j < setDriveCount; j++ {
 | 
						|
							disk := storageDisks[i*setDriveCount+j]
 | 
						|
							logger.Info("   - Drive: %s", disk.String())
 | 
						|
						}
 | 
						|
					})
 | 
						|
					logger.Info(color.Yellow("WARNING:")+" Host %v has more than %v drives of set. "+
 | 
						|
						"A host failure will result in data becoming unavailable.", host, wantAtMost)
 | 
						|
				}
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	// Mark all root disks down
 | 
						|
	markRootDisksAsDown(storageDisks, sErrs)
 | 
						|
 | 
						|
	// Save formats `format.json` across all disks.
 | 
						|
	if err := saveFormatErasureAll(ctx, storageDisks, formats); err != nil {
 | 
						|
		return nil, err
 | 
						|
	}
 | 
						|
 | 
						|
	return getFormatErasureInQuorum(formats)
 | 
						|
}
 | 
						|
 | 
						|
// ecDrivesNoConfig returns the erasure coded drives in a set if no config has been set.
 | 
						|
// It will attempt to read it from env variable and fall back to drives/2.
 | 
						|
func ecDrivesNoConfig(setDriveCount int) int {
 | 
						|
	ecDrives := globalStorageClass.GetParityForSC(storageclass.STANDARD)
 | 
						|
	if ecDrives == 0 {
 | 
						|
		cfg, err := storageclass.LookupConfig(nil, setDriveCount)
 | 
						|
		if err == nil {
 | 
						|
			ecDrives = cfg.Standard.Parity
 | 
						|
		}
 | 
						|
		if ecDrives == 0 {
 | 
						|
			ecDrives = setDriveCount / 2
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return ecDrives
 | 
						|
}
 | 
						|
 | 
						|
// Make Erasure backend meta volumes.
 | 
						|
func makeFormatErasureMetaVolumes(disk StorageAPI) error {
 | 
						|
	if disk == nil {
 | 
						|
		return errDiskNotFound
 | 
						|
	}
 | 
						|
	// Attempt to create MinIO internal buckets.
 | 
						|
	return disk.MakeVolBulk(context.TODO(), minioMetaBucket, minioMetaTmpBucket, minioMetaMultipartBucket, dataUsageBucket)
 | 
						|
}
 | 
						|
 | 
						|
// Initialize a new set of set formats which will be written to all disks.
 | 
						|
func newHealFormatSets(refFormat *formatErasureV3, setCount, setDriveCount int, formats []*formatErasureV3, errs []error) [][]*formatErasureV3 {
 | 
						|
	newFormats := make([][]*formatErasureV3, setCount)
 | 
						|
	for i := range refFormat.Erasure.Sets {
 | 
						|
		newFormats[i] = make([]*formatErasureV3, setDriveCount)
 | 
						|
	}
 | 
						|
	for i := range refFormat.Erasure.Sets {
 | 
						|
		for j := range refFormat.Erasure.Sets[i] {
 | 
						|
			if errors.Is(errs[i*setDriveCount+j], errUnformattedDisk) {
 | 
						|
				newFormats[i][j] = &formatErasureV3{}
 | 
						|
				newFormats[i][j].ID = refFormat.ID
 | 
						|
				newFormats[i][j].Format = refFormat.Format
 | 
						|
				newFormats[i][j].Version = refFormat.Version
 | 
						|
				newFormats[i][j].Erasure.This = refFormat.Erasure.Sets[i][j]
 | 
						|
				newFormats[i][j].Erasure.Sets = refFormat.Erasure.Sets
 | 
						|
				newFormats[i][j].Erasure.Version = refFormat.Erasure.Version
 | 
						|
				newFormats[i][j].Erasure.DistributionAlgo = refFormat.Erasure.DistributionAlgo
 | 
						|
			}
 | 
						|
		}
 | 
						|
	}
 | 
						|
	return newFormats
 | 
						|
}
 |