mirror of https://github.com/minio/minio.git
				
				
				
			
		
			
	
	
		
			876 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Go
		
	
	
	
		
		
			
		
	
	
			876 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Go
		
	
	
	
|  | /* | ||
|  |  * Minio Cloud Storage, (C) 2016 Minio, Inc. | ||
|  |  * | ||
|  |  * Licensed under the Apache License, Version 2.0 (the "License"); | ||
|  |  * you may not use this file except in compliance with the License. | ||
|  |  * You may obtain a copy of the License at | ||
|  |  * | ||
|  |  *     http://www.apache.org/licenses/LICENSE-2.0
 | ||
|  |  * | ||
|  |  * Unless required by applicable law or agreed to in writing, software | ||
|  |  * distributed under the License is distributed on an "AS IS" BASIS, | ||
|  |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
|  |  * See the License for the specific language governing permissions and | ||
|  |  * limitations under the License. | ||
|  |  */ | ||
|  | 
 | ||
|  | package cmd | ||
|  | 
 | ||
|  | import ( | ||
|  | 	"encoding/json" | ||
|  | 	"errors" | ||
|  | 	"fmt" | ||
|  | 	"reflect" | ||
|  | 	"sync" | ||
|  | ) | ||
|  | 
 | ||
// fsFormat - holds the 'fs' section of the format config.
type fsFormat struct {
	// Version is serialized under the "version" JSON key.
	Version string `json:"version"`
}
|  | 
 | ||
// xlFormat - holds the 'xl' section of the format config.
type xlFormat struct {
	// Version of the 'xl' format.
	Version string `json:"version"`

	// Disk carries the uuid assigned to this disk.
	Disk string `json:"disk"`

	// JBOD carries the input disk order that was generated the
	// first time fresh disks were supplied.
	JBOD []string `json:"jbod"`
}
|  | 
 | ||
|  | // formatConfigV1 - structure holds format config version '1'.
 | ||
|  | type formatConfigV1 struct { | ||
|  | 	Version string `json:"version"` // Version of the format config.
 | ||
|  | 	// Format indicates the backend format type, supports two values 'xl' and 'fs'.
 | ||
|  | 	Format string    `json:"format"` | ||
|  | 	FS     *fsFormat `json:"fs,omitempty"` // FS field holds fs format.
 | ||
|  | 	XL     *xlFormat `json:"xl,omitempty"` // XL field holds xl format.
 | ||
|  | } | ||
|  | 
 | ||
|  | /* | ||
|  | 
 | ||
|  | All disks online | ||
|  | ----------------- | ||
|  | - All Unformatted - format all and return success. | ||
|  | - Some Unformatted - format all and return success. | ||
|  | - Any JBOD inconsistent - return failure // Requires deep inspection, phase2.
 | ||
|  | - Some are corrupt (missing format.json) - return failure  // Requires deep inspection, phase2.
 | ||
|  | - Any unrecognized disks - return failure | ||
|  | 
 | ||
|  | Some disks are offline and we have quorum. | ||
|  | ----------------- | ||
|  | - Some unformatted - no heal, return success. | ||
|  | - Any JBOD inconsistent - return failure // Requires deep inspection, phase2.
 | ||
|  | - Some are corrupt (missing format.json) - return failure  // Requires deep inspection, phase2.
 | ||
|  | - Any unrecognized disks - return failure | ||
|  | 
 | ||
|  | No read quorum | ||
|  | ----------------- | ||
|  | failure for all cases. | ||
|  | 
 | ||
|  | // Pseudo code for managing `format.json`.
 | ||
|  | 
 | ||
|  | // Generic checks.
 | ||
|  | if (no quorum) return error | ||
|  | if (any disk is corrupt) return error // phase2
 | ||
|  | if (jbod inconsistent) return error // phase2
 | ||
|  | if (disks not recognized) // Always error.
 | ||
|  | 
 | ||
|  | // Specific checks.
 | ||
|  | if (all disks online) | ||
|  |   if (all disks return format.json) | ||
|  |      if (jbod consistent) | ||
|  |         if (all disks recognized) | ||
|  |           return | ||
|  |   else | ||
|  |      if (all disks return format.json not found) | ||
|  |         (initialize format) | ||
|  |         return | ||
|  |      else (some disks return format.json not found) | ||
|  |         (heal format) | ||
|  |         return | ||
|  |      fi | ||
|  |    fi | ||
|  | else // No healing at this point forward, some disks are offline or dead.
 | ||
|  |    if (some disks return format.json not found) | ||
|  |       if (with force) | ||
|  |          // Offline disks are marked as dead.
 | ||
|  |          (heal format) // Offline disks should be marked as dead.
 | ||
|  |          return success | ||
|  |       else (without force) | ||
|  |          // --force is necessary to heal few drives, because some drives
 | ||
|  |          // are offline. Offline disks will be marked as dead.
 | ||
|  |          return error | ||
|  |       fi | ||
|  | fi | ||
|  | */ | ||
|  | 
 | ||
// Sentinel errors describing the combined state of the format config
// across a set of disks.
var (
	// errSomeDiskUnformatted - returned when some disks are found to be unformatted.
	errSomeDiskUnformatted = errors.New("some disks are found to be unformatted")

	// errSomeDiskOffline - returned when some disks are offline.
	errSomeDiskOffline = errors.New("some disks are offline")

	// errDiskOrderMismatch - returned when disk UUID is not in consistent JBOD order.
	errDiskOrderMismatch = errors.New("disk order mismatch")
)
|  | 
 | ||
|  | // Returns error slice into understandable errors.
 | ||
|  | func reduceFormatErrs(errs []error, diskCount int) (err error) { | ||
|  | 	var errUnformattedDiskCount = 0 | ||
|  | 	var errDiskNotFoundCount = 0 | ||
|  | 	var errCorruptedFormatCount = 0 | ||
|  | 	for _, dErr := range errs { | ||
|  | 		if dErr == errUnformattedDisk { | ||
|  | 			errUnformattedDiskCount++ | ||
|  | 		} else if dErr == errDiskNotFound { | ||
|  | 			errDiskNotFoundCount++ | ||
|  | 		} else if dErr == errCorruptedFormat { | ||
|  | 			errCorruptedFormatCount++ | ||
|  | 		} | ||
|  | 	} | ||
|  | 	if errCorruptedFormatCount > 0 { | ||
|  | 		return errCorruptedFormat | ||
|  | 	} | ||
|  | 	// Unformatted disks found, we need to figure out if any disks are offline.
 | ||
|  | 	if errUnformattedDiskCount > 0 { | ||
|  | 		// Returns errUnformattedDisk if all disks report unFormattedDisk.
 | ||
|  | 		if errUnformattedDiskCount < diskCount { | ||
|  | 			if errDiskNotFoundCount > 0 { | ||
|  | 				// Only some disks are fresh but some disks are offline as well.
 | ||
|  | 				return errSomeDiskOffline | ||
|  | 			} | ||
|  | 			// Some disks are fresh disks an unformatted, not disks are offline.
 | ||
|  | 			return errSomeDiskUnformatted | ||
|  | 		} | ||
|  | 		// All disks returned unformatted, all disks must be fresh.
 | ||
|  | 		return errUnformattedDisk | ||
|  | 	} | ||
|  | 	// No unformatted disks found no need to handle disk not found case, return success here.
 | ||
|  | 	return nil | ||
|  | } | ||
|  | 
 | ||
|  | // loadAllFormats - load all format config from all input disks in parallel.
 | ||
|  | func loadAllFormats(bootstrapDisks []StorageAPI) ([]*formatConfigV1, []error) { | ||
|  | 	// Initialize sync waitgroup.
 | ||
|  | 	var wg = &sync.WaitGroup{} | ||
|  | 
 | ||
|  | 	// Initialize list of errors.
 | ||
|  | 	var sErrs = make([]error, len(bootstrapDisks)) | ||
|  | 
 | ||
|  | 	// Initialize format configs.
 | ||
|  | 	var formatConfigs = make([]*formatConfigV1, len(bootstrapDisks)) | ||
|  | 
 | ||
|  | 	// Make a volume entry on all underlying storage disks.
 | ||
|  | 	for index, disk := range bootstrapDisks { | ||
|  | 		if disk == nil { | ||
|  | 			sErrs[index] = errDiskNotFound | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		wg.Add(1) | ||
|  | 		// Make a volume inside a go-routine.
 | ||
|  | 		go func(index int, disk StorageAPI) { | ||
|  | 			defer wg.Done() | ||
|  | 			formatConfig, lErr := loadFormat(disk) | ||
|  | 			if lErr != nil { | ||
|  | 				sErrs[index] = lErr | ||
|  | 				return | ||
|  | 			} | ||
|  | 			formatConfigs[index] = formatConfig | ||
|  | 		}(index, disk) | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Wait for all make vol to finish.
 | ||
|  | 	wg.Wait() | ||
|  | 
 | ||
|  | 	for _, err := range sErrs { | ||
|  | 		if err != nil { | ||
|  | 			// Return all formats and errors.
 | ||
|  | 			return formatConfigs, sErrs | ||
|  | 		} | ||
|  | 	} | ||
|  | 	// Return all formats and nil
 | ||
|  | 	return formatConfigs, nil | ||
|  | } | ||
|  | 
 | ||
|  | // genericFormatCheck - validates and returns error.
 | ||
|  | // if (no quorum) return error
 | ||
|  | // if (any disk is corrupt) return error // phase2
 | ||
|  | // if (jbod inconsistent) return error // phase2
 | ||
|  | // if (disks not recognized) // Always error.
 | ||
|  | func genericFormatCheck(formatConfigs []*formatConfigV1, sErrs []error) (err error) { | ||
|  | 	// Calculate the errors.
 | ||
|  | 	var ( | ||
|  | 		errCorruptFormatCount = 0 | ||
|  | 		errCount              = 0 | ||
|  | 	) | ||
|  | 
 | ||
|  | 	// Through all errors calculate the actual errors.
 | ||
|  | 	for _, lErr := range sErrs { | ||
|  | 		if lErr == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// These errors are good conditions, means disk is online.
 | ||
|  | 		if lErr == errUnformattedDisk || lErr == errVolumeNotFound { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		if lErr == errCorruptedFormat { | ||
|  | 			errCorruptFormatCount++ | ||
|  | 		} else { | ||
|  | 			errCount++ | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Calculate read quorum.
 | ||
|  | 	readQuorum := len(formatConfigs)/2 + 1 | ||
|  | 
 | ||
|  | 	// Validate the err count under tolerant limit.
 | ||
|  | 	if errCount > len(formatConfigs)-readQuorum { | ||
|  | 		return errXLReadQuorum | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Check if number of corrupted format under quorum
 | ||
|  | 	if errCorruptFormatCount > len(formatConfigs)-readQuorum { | ||
|  | 		return errCorruptedFormat | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Validates if format and JBOD are consistent across all disks.
 | ||
|  | 	if err = checkFormatXL(formatConfigs); err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Success..
 | ||
|  | 	return nil | ||
|  | } | ||
|  | 
 | ||
|  | // isSavedUUIDInOrder - validates if disk uuid is present and valid in all
 | ||
|  | // available format config JBOD. This function also validates if the disk UUID
 | ||
|  | // is always available on all JBOD under the same order.
 | ||
|  | func isSavedUUIDInOrder(uuid string, formatConfigs []*formatConfigV1) bool { | ||
|  | 	var orderIndexes []int | ||
|  | 	// Validate each for format.json for relevant uuid.
 | ||
|  | 	for _, formatConfig := range formatConfigs { | ||
|  | 		if formatConfig == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// Validate if UUID is present in JBOD.
 | ||
|  | 		uuidIndex := findDiskIndex(uuid, formatConfig.XL.JBOD) | ||
|  | 		if uuidIndex == -1 { | ||
|  | 			// UUID not found.
 | ||
|  | 			errorIf(errDiskNotFound, "Disk %s not found in JBOD list", uuid) | ||
|  | 			return false | ||
|  | 		} | ||
|  | 		// Save the position of UUID present in JBOD.
 | ||
|  | 		orderIndexes = append(orderIndexes, uuidIndex+1) | ||
|  | 	} | ||
|  | 	// Once uuid is found, verify if the uuid
 | ||
|  | 	// present in same order across all format configs.
 | ||
|  | 	prevOrderIndex := orderIndexes[0] | ||
|  | 	for _, orderIndex := range orderIndexes { | ||
|  | 		if prevOrderIndex != orderIndex { | ||
|  | 			errorIf(errDiskOrderMismatch, "Disk %s is in wrong order wanted %d, saw %d ", uuid, prevOrderIndex, orderIndex) | ||
|  | 			return false | ||
|  | 		} | ||
|  | 	} | ||
|  | 	// Returns success, when we have verified if uuid
 | ||
|  | 	// is consistent and valid across all format configs.
 | ||
|  | 	return true | ||
|  | } | ||
|  | 
 | ||
|  | // checkDisksConsistency - checks if all disks are consistent with all JBOD entries on all disks.
 | ||
|  | func checkDisksConsistency(formatConfigs []*formatConfigV1) error { | ||
|  | 	var disks = make([]string, len(formatConfigs)) | ||
|  | 	// Collect currently available disk uuids.
 | ||
|  | 	for index, formatConfig := range formatConfigs { | ||
|  | 		if formatConfig == nil { | ||
|  | 			disks[index] = "" | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		disks[index] = formatConfig.XL.Disk | ||
|  | 	} | ||
|  | 	// Validate collected uuids and verify JBOD.
 | ||
|  | 	for _, uuid := range disks { | ||
|  | 		if uuid == "" { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// Is uuid present on all JBOD ?.
 | ||
|  | 		if !isSavedUUIDInOrder(uuid, formatConfigs) { | ||
|  | 			return fmt.Errorf("%s disk not found in JBOD", uuid) | ||
|  | 		} | ||
|  | 	} | ||
|  | 	return nil | ||
|  | } | ||
|  | 
 | ||
|  | // checkJBODConsistency - validate xl jbod order if they are consistent.
 | ||
|  | func checkJBODConsistency(formatConfigs []*formatConfigV1) error { | ||
|  | 	var sentinelJBOD []string | ||
|  | 	// Extract first valid JBOD.
 | ||
|  | 	for _, format := range formatConfigs { | ||
|  | 		if format == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		sentinelJBOD = format.XL.JBOD | ||
|  | 		break | ||
|  | 	} | ||
|  | 	for _, format := range formatConfigs { | ||
|  | 		if format == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		currentJBOD := format.XL.JBOD | ||
|  | 		if !reflect.DeepEqual(sentinelJBOD, currentJBOD) { | ||
|  | 			return errors.New("Inconsistent JBOD found.") | ||
|  | 		} | ||
|  | 	} | ||
|  | 	return nil | ||
|  | } | ||
|  | 
 | ||
// findDiskIndex - returns the position of the first entry in jbod equal
// to disk, or -1 when there is no such entry.
func findDiskIndex(disk string, jbod []string) int {
	for pos := 0; pos < len(jbod); pos++ {
		if jbod[pos] == disk {
			return pos
		}
	}
	return -1
}
|  | 
 | ||
|  | // reorderDisks - reorder disks in JBOD order.
 | ||
|  | func reorderDisks(bootstrapDisks []StorageAPI, formatConfigs []*formatConfigV1) ([]StorageAPI, error) { | ||
|  | 	var savedJBOD []string | ||
|  | 	for _, format := range formatConfigs { | ||
|  | 		if format == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		savedJBOD = format.XL.JBOD | ||
|  | 		break | ||
|  | 	} | ||
|  | 	// Pick the first JBOD list to verify the order and construct new set of disk slice.
 | ||
|  | 	var newDisks = make([]StorageAPI, len(bootstrapDisks)) | ||
|  | 	for fIndex, format := range formatConfigs { | ||
|  | 		if format == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		jIndex := findDiskIndex(format.XL.Disk, savedJBOD) | ||
|  | 		if jIndex == -1 { | ||
|  | 			return nil, errors.New("Unrecognized uuid " + format.XL.Disk + " found") | ||
|  | 		} | ||
|  | 		newDisks[jIndex] = bootstrapDisks[fIndex] | ||
|  | 	} | ||
|  | 	return newDisks, nil | ||
|  | } | ||
|  | 
 | ||
|  | // loadFormat - loads format.json from disk.
 | ||
|  | func loadFormat(disk StorageAPI) (format *formatConfigV1, err error) { | ||
|  | 	buf, err := disk.ReadAll(minioMetaBucket, formatConfigFile) | ||
|  | 	if err != nil { | ||
|  | 		// 'file not found' and 'volume not found' as
 | ||
|  | 		// same. 'volume not found' usually means its a fresh disk.
 | ||
|  | 		if err == errFileNotFound || err == errVolumeNotFound { | ||
|  | 			var vols []VolInfo | ||
|  | 			vols, err = disk.ListVols() | ||
|  | 			if err != nil { | ||
|  | 				return nil, err | ||
|  | 			} | ||
|  | 			if len(vols) > 1 { | ||
|  | 				// 'format.json' not found, but we found user data.
 | ||
|  | 				return nil, errCorruptedFormat | ||
|  | 			} | ||
|  | 			// No other data found, its a fresh disk.
 | ||
|  | 			return nil, errUnformattedDisk | ||
|  | 		} | ||
|  | 		return nil, err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Try to decode format json into formatConfigV1 struct.
 | ||
|  | 	format = &formatConfigV1{} | ||
|  | 	if err = json.Unmarshal(buf, format); err != nil { | ||
|  | 		return nil, err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Success.
 | ||
|  | 	return format, nil | ||
|  | } | ||
|  | 
 | ||
|  | // isFormatNotFound - returns true if all `format.json` are not
 | ||
|  | // found on all disks.
 | ||
|  | func isFormatNotFound(formats []*formatConfigV1) bool { | ||
|  | 	for _, format := range formats { | ||
|  | 		// One of the `format.json` is found.
 | ||
|  | 		if format != nil { | ||
|  | 			return false | ||
|  | 		} | ||
|  | 	} | ||
|  | 	// All format.json missing, success.
 | ||
|  | 	return true | ||
|  | } | ||
|  | 
 | ||
|  | // isFormatFound - returns true if all input formats are found on
 | ||
|  | // all disks.
 | ||
|  | func isFormatFound(formats []*formatConfigV1) bool { | ||
|  | 	for _, format := range formats { | ||
|  | 		// One of `format.json` is not found.
 | ||
|  | 		if format == nil { | ||
|  | 			return false | ||
|  | 		} | ||
|  | 	} | ||
|  | 	// All format.json present, success.
 | ||
|  | 	return true | ||
|  | } | ||
|  | 
 | ||
|  | // Heals any missing format.json on the drives. Returns error only for unexpected errors
 | ||
|  | // as regular errors can be ignored since there might be enough quorum to be operational.
 | ||
|  | // Heals only fresh disks.
 | ||
|  | func healFormatXLFreshDisks(storageDisks []StorageAPI) error { | ||
|  | 	formatConfigs := make([]*formatConfigV1, len(storageDisks)) | ||
|  | 	var referenceConfig *formatConfigV1 | ||
|  | 	// Loads `format.json` from all disks.
 | ||
|  | 	for index, disk := range storageDisks { | ||
|  | 		// Disk not found or ignored is a valid case.
 | ||
|  | 		if disk == nil { | ||
|  | 			// Return nil, one of the disk is offline.
 | ||
|  | 			return nil | ||
|  | 		} | ||
|  | 		formatXL, err := loadFormat(disk) | ||
|  | 		if err != nil { | ||
|  | 			if err == errUnformattedDisk { | ||
|  | 				// format.json is missing, should be healed.
 | ||
|  | 				continue | ||
|  | 			} else if err == errDiskNotFound { // Is a valid case we
 | ||
|  | 				// can proceed without healing.
 | ||
|  | 				return nil | ||
|  | 			} | ||
|  | 			// Return error for unsupported errors.
 | ||
|  | 			return err | ||
|  | 		} // Success.
 | ||
|  | 		formatConfigs[index] = formatXL | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// All `format.json` has been read successfully, previously completed.
 | ||
|  | 	if isFormatFound(formatConfigs) { | ||
|  | 		// Return success.
 | ||
|  | 		return nil | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// All disks are fresh, format.json will be written by initFormatXL()
 | ||
|  | 	if isFormatNotFound(formatConfigs) { | ||
|  | 		return initFormatXL(storageDisks) | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Validate format configs for consistency in JBOD and disks.
 | ||
|  | 	if err := checkFormatXL(formatConfigs); err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	if referenceConfig == nil { | ||
|  | 		// This config will be used to update the drives missing format.json.
 | ||
|  | 		for _, formatConfig := range formatConfigs { | ||
|  | 			if formatConfig == nil { | ||
|  | 				continue | ||
|  | 			} | ||
|  | 			referenceConfig = formatConfig | ||
|  | 			break | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Collect new JBOD.
 | ||
|  | 	newJBOD := referenceConfig.XL.JBOD | ||
|  | 
 | ||
|  | 	// Reorder the disks based on the JBOD order.
 | ||
|  | 	orderedDisks, err := reorderDisks(storageDisks, formatConfigs) | ||
|  | 	if err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// From ordered disks fill the UUID position.
 | ||
|  | 	for index, disk := range orderedDisks { | ||
|  | 		if disk == nil { | ||
|  | 			newJBOD[index] = getUUID() | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Collect new format configs.
 | ||
|  | 	var newFormatConfigs = make([]*formatConfigV1, len(orderedDisks)) | ||
|  | 
 | ||
|  | 	// Collect new format configs that need to be written.
 | ||
|  | 	for index := range orderedDisks { | ||
|  | 		// New configs are generated since we are going
 | ||
|  | 		// to re-populate across all disks.
 | ||
|  | 		config := &formatConfigV1{ | ||
|  | 			Version: referenceConfig.Version, | ||
|  | 			Format:  referenceConfig.Format, | ||
|  | 			XL: &xlFormat{ | ||
|  | 				Version: referenceConfig.XL.Version, | ||
|  | 				Disk:    newJBOD[index], | ||
|  | 				JBOD:    newJBOD, | ||
|  | 			}, | ||
|  | 		} | ||
|  | 		newFormatConfigs[index] = config | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Fill in the missing disk back from format configs.
 | ||
|  | 	// We need to make sure we have kept the previous order
 | ||
|  | 	// and allowed fresh disks to be arranged anywhere.
 | ||
|  | 	// Following block facilitates to put fresh disks.
 | ||
|  | 	for index, format := range formatConfigs { | ||
|  | 		// Format is missing so we go through ordered disks.
 | ||
|  | 		if format == nil { | ||
|  | 			// At this point when disk is missing the fresh disk
 | ||
|  | 			// in the stack get it back from storageDisks.
 | ||
|  | 			for oIndex, disk := range orderedDisks { | ||
|  | 				if disk == nil { | ||
|  | 					orderedDisks[oIndex] = storageDisks[index] | ||
|  | 					break | ||
|  | 				} | ||
|  | 			} | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Save new `format.json` across all disks, in JBOD order.
 | ||
|  | 	return saveFormatXL(orderedDisks, newFormatConfigs) | ||
|  | } | ||
|  | 
 | ||
|  | // Disks from storageDiks are put in assignedDisks if found in orderedDisks and in unAssignedDisks otherwise
 | ||
|  | func splitDisksByUse(storageDisks, orderedDisks []StorageAPI) (assignedDisks []StorageAPI, unAssignedDisks []StorageAPI) { | ||
|  | 	// Populate unAssignDisks
 | ||
|  | 	for i := range storageDisks { | ||
|  | 		found := false | ||
|  | 		for j := range orderedDisks { | ||
|  | 			if storageDisks[i] == orderedDisks[j] { | ||
|  | 				found = true | ||
|  | 				assignedDisks = append(assignedDisks, storageDisks[i]) | ||
|  | 				break | ||
|  | 			} | ||
|  | 		} | ||
|  | 		if !found { | ||
|  | 			unAssignedDisks = append(unAssignedDisks, storageDisks[i]) | ||
|  | 		} | ||
|  | 	} | ||
|  | 	return assignedDisks, unAssignedDisks | ||
|  | } | ||
|  | 
 | ||
|  | // Inspect the content of all disks to guess the right order according to the format files.
 | ||
|  | // The right order is represented in orderedDisks
 | ||
|  | func reorderDisksByInspection(orderedDisks, storageDisks []StorageAPI, formatConfigs []*formatConfigV1) ([]StorageAPI, error) { | ||
|  | 	for index, format := range formatConfigs { | ||
|  | 		if format != nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		vols, err := storageDisks[index].ListVols() | ||
|  | 		if err != nil { | ||
|  | 			return nil, err | ||
|  | 		} | ||
|  | 		if len(vols) == 0 { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		volName := "" | ||
|  | 		// Avoid picking minioMetaBucket because ListVols() returns a non ordered list
 | ||
|  | 		for i := range vols { | ||
|  | 			if vols[i].Name != minioMetaBucket { | ||
|  | 				volName = vols[i].Name | ||
|  | 				break | ||
|  | 			} | ||
|  | 		} | ||
|  | 		if volName == "" { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		objects, err := storageDisks[index].ListDir(volName, "") | ||
|  | 		if err != nil { | ||
|  | 			return nil, err | ||
|  | 		} | ||
|  | 		if len(objects) == 0 { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		xlData, err := readXLMeta(storageDisks[index], volName, objects[0]) | ||
|  | 		if err != nil { | ||
|  | 			if err == errFileNotFound { | ||
|  | 				continue | ||
|  | 			} | ||
|  | 			return nil, err | ||
|  | 		} | ||
|  | 		diskIndex := -1 | ||
|  | 		for i, d := range xlData.Erasure.Distribution { | ||
|  | 			if d == xlData.Erasure.Index { | ||
|  | 				diskIndex = i | ||
|  | 			} | ||
|  | 		} | ||
|  | 		// Check for found results
 | ||
|  | 		if diskIndex == -1 || orderedDisks[diskIndex] != nil { | ||
|  | 			// Some inconsistent data are found, exit immediately.
 | ||
|  | 			return nil, errCorruptedFormat | ||
|  | 		} | ||
|  | 		orderedDisks[diskIndex] = storageDisks[index] | ||
|  | 	} | ||
|  | 	return orderedDisks, nil | ||
|  | } | ||
|  | 
 | ||
|  | // Heals corrupted format json in all disks
 | ||
|  | func healFormatXLCorruptedDisks(storageDisks []StorageAPI) error { | ||
|  | 	formatConfigs := make([]*formatConfigV1, len(storageDisks)) | ||
|  | 	var referenceConfig *formatConfigV1 | ||
|  | 
 | ||
|  | 	// Loads `format.json` from all disks.
 | ||
|  | 	for index, disk := range storageDisks { | ||
|  | 		// Disk not found or ignored is a valid case.
 | ||
|  | 		if disk == nil { | ||
|  | 			// Return nil, one of the disk is offline.
 | ||
|  | 			return nil | ||
|  | 		} | ||
|  | 		formatXL, err := loadFormat(disk) | ||
|  | 		if err != nil { | ||
|  | 			if err == errUnformattedDisk || err == errCorruptedFormat { | ||
|  | 				// format.json is missing or corrupted, should be healed.
 | ||
|  | 				continue | ||
|  | 			} else if err == errDiskNotFound { // Is a valid case we
 | ||
|  | 				// can proceed without healing.
 | ||
|  | 				return nil | ||
|  | 			} | ||
|  | 			// Return error for unsupported errors.
 | ||
|  | 			return err | ||
|  | 		} // Success.
 | ||
|  | 		formatConfigs[index] = formatXL | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// All `format.json` has been read successfully, previously completed.
 | ||
|  | 	if isFormatFound(formatConfigs) { | ||
|  | 		// Return success.
 | ||
|  | 		return nil | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// All disks are fresh, format.json will be written by initFormatXL()
 | ||
|  | 	if isFormatNotFound(formatConfigs) { | ||
|  | 		return initFormatXL(storageDisks) | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Validate format configs for consistency in JBOD and disks.
 | ||
|  | 	if err := checkFormatXL(formatConfigs); err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	if referenceConfig == nil { | ||
|  | 		// This config will be used to update the drives missing format.json.
 | ||
|  | 		for _, formatConfig := range formatConfigs { | ||
|  | 			if formatConfig == nil { | ||
|  | 				continue | ||
|  | 			} | ||
|  | 			referenceConfig = formatConfig | ||
|  | 			break | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Collect new JBOD.
 | ||
|  | 	newJBOD := referenceConfig.XL.JBOD | ||
|  | 
 | ||
|  | 	// Reorder the disks based on the JBOD order.
 | ||
|  | 	orderedDisks, err := reorderDisks(storageDisks, formatConfigs) | ||
|  | 	if err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// From ordered disks fill the UUID position.
 | ||
|  | 	for index, disk := range orderedDisks { | ||
|  | 		if disk == nil { | ||
|  | 			newJBOD[index] = getUUID() | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// For disks with corrupted formats, inspect the disks contents to guess the disks order
 | ||
|  | 	orderedDisks, err = reorderDisksByInspection(orderedDisks, storageDisks, formatConfigs) | ||
|  | 	if err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// At this stage, all disks with corrupted formats but with objects inside found their way.
 | ||
|  | 	// Now take care of unformatted disks, which are the `unAssignedDisks`
 | ||
|  | 	_, unAssignedDisks := splitDisksByUse(storageDisks, orderedDisks) | ||
|  | 
 | ||
|  | 	// Assign unassigned disks to nil elements in orderedDisks
 | ||
|  | 	for i, disk := range orderedDisks { | ||
|  | 		if disk == nil && len(unAssignedDisks) > 0 { | ||
|  | 			orderedDisks[i] = unAssignedDisks[0] | ||
|  | 			unAssignedDisks = unAssignedDisks[1:] | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Collect new format configs.
 | ||
|  | 	var newFormatConfigs = make([]*formatConfigV1, len(orderedDisks)) | ||
|  | 
 | ||
|  | 	// Collect new format configs that need to be written.
 | ||
|  | 	for index := range orderedDisks { | ||
|  | 		// New configs are generated since we are going
 | ||
|  | 		// to re-populate across all disks.
 | ||
|  | 		config := &formatConfigV1{ | ||
|  | 			Version: referenceConfig.Version, | ||
|  | 			Format:  referenceConfig.Format, | ||
|  | 			XL: &xlFormat{ | ||
|  | 				Version: referenceConfig.XL.Version, | ||
|  | 				Disk:    newJBOD[index], | ||
|  | 				JBOD:    newJBOD, | ||
|  | 			}, | ||
|  | 		} | ||
|  | 		newFormatConfigs[index] = config | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Save new `format.json` across all disks, in JBOD order.
 | ||
|  | 	return saveFormatXL(orderedDisks, newFormatConfigs) | ||
|  | } | ||
|  | 
 | ||
|  | // loadFormatXL - loads XL `format.json` and returns back properly
 | ||
|  | // ordered storage slice based on `format.json`.
 | ||
|  | func loadFormatXL(bootstrapDisks []StorageAPI) (disks []StorageAPI, err error) { | ||
|  | 	var unformattedDisksFoundCnt = 0 | ||
|  | 	var diskNotFoundCount = 0 | ||
|  | 	formatConfigs := make([]*formatConfigV1, len(bootstrapDisks)) | ||
|  | 
 | ||
|  | 	// Try to load `format.json` bootstrap disks.
 | ||
|  | 	for index, disk := range bootstrapDisks { | ||
|  | 		if disk == nil { | ||
|  | 			diskNotFoundCount++ | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		var formatXL *formatConfigV1 | ||
|  | 		formatXL, err = loadFormat(disk) | ||
|  | 		if err != nil { | ||
|  | 			if err == errUnformattedDisk { | ||
|  | 				unformattedDisksFoundCnt++ | ||
|  | 				continue | ||
|  | 			} else if err == errDiskNotFound { | ||
|  | 				diskNotFoundCount++ | ||
|  | 				continue | ||
|  | 			} | ||
|  | 			return nil, err | ||
|  | 		} | ||
|  | 		// Save valid formats.
 | ||
|  | 		formatConfigs[index] = formatXL | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// If all disks indicate that 'format.json' is not available return 'errUnformattedDisk'.
 | ||
|  | 	if unformattedDisksFoundCnt > len(bootstrapDisks)-(len(bootstrapDisks)/2+1) { | ||
|  | 		return nil, errUnformattedDisk | ||
|  | 	} else if diskNotFoundCount == len(bootstrapDisks) { | ||
|  | 		return nil, errDiskNotFound | ||
|  | 	} else if diskNotFoundCount > len(bootstrapDisks)-(len(bootstrapDisks)/2+1) { | ||
|  | 		return nil, errXLReadQuorum | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Validate the format configs read are correct.
 | ||
|  | 	if err = checkFormatXL(formatConfigs); err != nil { | ||
|  | 		return nil, err | ||
|  | 	} | ||
|  | 	// Erasure code requires disks to be presented in the same order each time.
 | ||
|  | 	return reorderDisks(bootstrapDisks, formatConfigs) | ||
|  | } | ||
|  | 
 | ||
|  | // checkFormatXL - verifies if format.json format is intact.
 | ||
|  | func checkFormatXL(formatConfigs []*formatConfigV1) error { | ||
|  | 	for _, formatXL := range formatConfigs { | ||
|  | 		if formatXL == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// Validate format version and format type.
 | ||
|  | 		if formatXL.Version != "1" { | ||
|  | 			return fmt.Errorf("Unsupported version of backend format [%s] found.", formatXL.Version) | ||
|  | 		} | ||
|  | 		if formatXL.Format != "xl" { | ||
|  | 			return fmt.Errorf("Unsupported backend format [%s] found.", formatXL.Format) | ||
|  | 		} | ||
|  | 		if formatXL.XL.Version != "1" { | ||
|  | 			return fmt.Errorf("Unsupported XL backend format found [%s]", formatXL.XL.Version) | ||
|  | 		} | ||
|  | 		if len(formatConfigs) != len(formatXL.XL.JBOD) { | ||
|  | 			return fmt.Errorf("Number of disks %d did not match the backend format %d", len(formatConfigs), len(formatXL.XL.JBOD)) | ||
|  | 		} | ||
|  | 	} | ||
|  | 	if err := checkJBODConsistency(formatConfigs); err != nil { | ||
|  | 		return err | ||
|  | 	} | ||
|  | 	return checkDisksConsistency(formatConfigs) | ||
|  | } | ||
|  | 
 | ||
|  | // saveFormatXL - populates `format.json` on disks in its order.
 | ||
|  | func saveFormatXL(storageDisks []StorageAPI, formats []*formatConfigV1) error { | ||
|  | 	var errs = make([]error, len(storageDisks)) | ||
|  | 	var wg = &sync.WaitGroup{} | ||
|  | 	// Write `format.json` to all disks.
 | ||
|  | 	for index, disk := range storageDisks { | ||
|  | 		if disk == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		wg.Add(1) | ||
|  | 		go func(index int, disk StorageAPI, format *formatConfigV1) { | ||
|  | 			defer wg.Done() | ||
|  | 
 | ||
|  | 			// Marshal and write to disk.
 | ||
|  | 			formatBytes, err := json.Marshal(format) | ||
|  | 			if err != nil { | ||
|  | 				errs[index] = err | ||
|  | 				return | ||
|  | 			} | ||
|  | 
 | ||
|  | 			// Purge any existing temporary file, okay to ignore errors here.
 | ||
|  | 			disk.DeleteFile(minioMetaBucket, formatConfigFileTmp) | ||
|  | 
 | ||
|  | 			// Append file `format.json.tmp`.
 | ||
|  | 			if err = disk.AppendFile(minioMetaBucket, formatConfigFileTmp, formatBytes); err != nil { | ||
|  | 				errs[index] = err | ||
|  | 				return | ||
|  | 			} | ||
|  | 			// Rename file `format.json.tmp` --> `format.json`.
 | ||
|  | 			if err = disk.RenameFile(minioMetaBucket, formatConfigFileTmp, minioMetaBucket, formatConfigFile); err != nil { | ||
|  | 				errs[index] = err | ||
|  | 				return | ||
|  | 			} | ||
|  | 		}(index, disk, formats[index]) | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Wait for the routines to finish.
 | ||
|  | 	wg.Wait() | ||
|  | 
 | ||
|  | 	// Validate if we encountered any errors, return quickly.
 | ||
|  | 	for _, err := range errs { | ||
|  | 		if err != nil { | ||
|  | 			// Failure.
 | ||
|  | 			return err | ||
|  | 		} | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Success.
 | ||
|  | 	return nil | ||
|  | } | ||
|  | 
 | ||
|  | // initFormatXL - save XL format configuration on all disks.
 | ||
|  | func initFormatXL(storageDisks []StorageAPI) (err error) { | ||
|  | 	// Initialize jbods.
 | ||
|  | 	var jbod = make([]string, len(storageDisks)) | ||
|  | 
 | ||
|  | 	// Initialize formats.
 | ||
|  | 	var formats = make([]*formatConfigV1, len(storageDisks)) | ||
|  | 
 | ||
|  | 	// Initialize `format.json`.
 | ||
|  | 	for index, disk := range storageDisks { | ||
|  | 		if disk == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// Allocate format config.
 | ||
|  | 		formats[index] = &formatConfigV1{ | ||
|  | 			Version: "1", | ||
|  | 			Format:  "xl", | ||
|  | 			XL: &xlFormat{ | ||
|  | 				Version: "1", | ||
|  | 				Disk:    getUUID(), | ||
|  | 			}, | ||
|  | 		} | ||
|  | 		jbod[index] = formats[index].XL.Disk | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Update the jbod entries.
 | ||
|  | 	for index, disk := range storageDisks { | ||
|  | 		if disk == nil { | ||
|  | 			continue | ||
|  | 		} | ||
|  | 		// Save jbod.
 | ||
|  | 		formats[index].XL.JBOD = jbod | ||
|  | 	} | ||
|  | 
 | ||
|  | 	// Save formats `format.json` across all disks.
 | ||
|  | 	return saveFormatXL(storageDisks, formats) | ||
|  | } |