ollama/convert/reader_safetensors.go

package convert

import (
	"bufio"
	"bytes"
	"encoding/binary"
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"io/fs"
	"maps"
	"slices"
	"strings"

	"github.com/d4l3k/go-bfloat16"
	"github.com/x448/float16"
)

// safetensorMetadata is one entry of the JSON header found at the start of a
// safetensors file, keyed in the header by the tensor's name.
type safetensorMetadata struct {
	// Type is the "dtype" string of the entry; entries with an empty Type
	// are skipped by parseSafetensors.
	Type    string   `json:"dtype"`
	// Shape holds the tensor dimensions from the "shape" field.
	Shape   []uint64 `json:"shape"`
	// Offsets holds the "data_offsets" pair; parseSafetensors reads element
	// 0 as the start and element 1 as the end of the tensor's bytes, both
	// counted from the end of the JSON header.
	Offsets []int64  `json:"data_offsets"`
}

// parseSafetensors reads the JSON header of every safetensors file named in
// ps (opened through fsys) and returns one Tensor per header entry that
// declares a dtype. Tensor names are rewritten with replacer before being
// stored. Only headers are read here; tensor data is read later by WriteTo.
//
// An error is returned if a file cannot be opened or decoded, if an entry has
// an empty shape, if its data offsets are malformed, or if two entries of the
// same file map to the same rewritten name.
func parseSafetensors(fsys fs.FS, replacer *strings.Replacer, ps ...string) ([]Tensor, error) {
	var ts []Tensor
	for _, p := range ps {
		// Each file is handled in a helper so that its handle is closed as
		// soon as its header has been parsed, instead of every file staying
		// open until the whole loop finishes.
		fileTensors, err := parseSafetensorsFile(fsys, replacer, p)
		if err != nil {
			return nil, err
		}
		ts = append(ts, fileTensors...)
	}

	return ts, nil
}

// parseSafetensorsFile parses the header of the single safetensors file p and
// returns its tensors in sorted key order.
func parseSafetensorsFile(fsys fs.FS, replacer *strings.Replacer, p string) ([]Tensor, error) {
	f, err := fsys.Open(p)
	if err != nil {
		return nil, err
	}
	defer f.Close()

	// The file starts with an 8-byte little-endian header length.
	var n int64
	if err := binary.Read(f, binary.LittleEndian, &n); err != nil {
		return nil, err
	}
	if n < 0 {
		return nil, fmt.Errorf("invalid safetensors header length %d in '%s'", n, p)
	}

	// Let the buffer grow as data arrives rather than trusting n for an
	// up-front allocation; a corrupt length then fails with EOF instead of
	// panicking or exhausting memory.
	var b bytes.Buffer
	if _, err := io.CopyN(&b, f, n); err != nil {
		return nil, err
	}

	var headers map[string]safetensorMetadata
	if err := json.NewDecoder(&b).Decode(&headers); err != nil {
		return nil, err
	}

	// Sort the keys so the resulting tensor order is deterministic.
	keys := slices.Sorted(maps.Keys(headers))
	names := make(map[string]struct{}, len(keys))

	var ts []Tensor
	for _, key := range keys {
		value := headers[key]
		if value.Type == "" {
			// Entries without a dtype are not tensors.
			continue
		}

		// bitsandbytes quantized models are unsupported
		if len(value.Shape) == 0 {
			return nil, errors.New("unsupported safetensors model")
		}

		// Guard the index expressions below against malformed headers.
		if len(value.Offsets) != 2 || value.Offsets[0] < 0 || value.Offsets[1] < value.Offsets[0] {
			return nil, fmt.Errorf("invalid data offsets %v for tensor '%s'", value.Offsets, key)
		}
		begin, end := value.Offsets[0], value.Offsets[1]

		ggufName := replacer.Replace(key)
		if _, ok := names[ggufName]; ok {
			return nil, fmt.Errorf("duplicate tensor name '%s' was found for this model", ggufName)
		}
		names[ggufName] = struct{}{}

		ts = append(ts, safetensor{
			fs:     fsys,
			path:   p,
			dtype:  value.Type,
			offset: safetensorsPad(n, begin),
			size:   end - begin,
			tensorBase: &tensorBase{
				name:  ggufName,
				shape: value.Shape,
			},
		})
	}

	return ts, nil
}

// safetensorsPad converts a data offset taken from a safetensors header into
// an offset from the start of the file. n is the length of the JSON header and
// offset is relative to the end of that header; the result also accounts for
// the 8-byte length prefix that precedes the header.
func safetensorsPad(n, offset int64) int64 {
	const lengthPrefix = 8
	return lengthPrefix + n + offset
}

// safetensor describes a single tensor stored inside a safetensors file. It
// records where the data lives rather than holding it; WriteTo opens the file
// and reads the bytes on demand.
type safetensor struct {
	// fs and path identify the file that WriteTo opens.
	fs     fs.FS
	path   string
	// dtype is the dtype string from the file header; WriteTo handles
	// "F32", "F16", "BF16" and "U8".
	dtype  string
	// offset is the position of the tensor data from the start of the file
	// and size is its length in bytes.
	offset int64
	size   int64
	// tensorBase supplies the name, shape and optional repacker.
	*tensorBase
}

// Kind reports the storage type the tensor is written as. It starts from the
// kind chosen by the embedded tensorBase and upgrades it to BF16 when the
// source data is BF16, unless the base kind is FP32 or the tensor name starts
// with "v.".
func (st safetensor) Kind() uint32 {
	base := st.tensorBase.Kind()

	switch {
	case strings.HasPrefix(st.name, "v."):
		// "v."-prefixed tensors keep the base kind.
		return base
	case st.dtype != "BF16":
		return base
	case base == tensorKindFP32:
		return base
	}

	return tensorKindBF16
}

// Clone returns a new safetensor that refers to the same file region as st.
// The embedded tensorBase is rebuilt with the same name and repacker and a
// copy of the shape slice, so changes to the clone's shape do not affect st.
func (st safetensor) Clone() Tensor {
	base := &tensorBase{
		name:     st.name,
		repacker: st.repacker,
		shape:    slices.Clone(st.shape),
	}

	dup := &safetensor{
		fs:     st.fs,
		path:   st.path,
		dtype:  st.dtype,
		offset: st.offset,
		size:   st.size,
	}
	dup.tensorBase = base

	return dup
}

// WriteTo reads the tensor's bytes from its file and writes them to w in the
// storage type reported by Kind, returning the number of bytes produced.
//
// When there is no repacker and the source dtype already matches the output
// kind (or the dtype is "U8"), the bytes are streamed straight through.
// Otherwise the data is decoded to float32, optionally passed through the
// repacker, and re-encoded as FP32, FP16 or BF16. Unknown dtypes and unknown
// output kinds yield an error.
func (st safetensor) WriteTo(w io.Writer) (int64, error) {
	file, err := st.fs.Open(st.path)
	if err != nil {
		return 0, err
	}
	defer file.Close()

	// Position a reader at the first byte of the tensor data using the
	// cheapest mechanism the file supports: random access, then seeking,
	// then reading and discarding the leading bytes.
	var src io.Reader = file
	switch v := file.(type) {
	case io.ReaderAt:
		src = io.NewSectionReader(v, st.offset, st.size)
	case io.Seeker:
		if _, err := v.Seek(st.offset, io.SeekStart); err != nil {
			return 0, err
		}
	default:
		if _, err := io.CopyN(io.Discard, file, st.offset); err != nil {
			return 0, err
		}
	}

	buffered := bufio.NewReaderSize(src, min(32<<10, int(st.size)))

	// Fast path: nothing to transform, so copy the raw bytes through.
	if st.repacker == nil {
		switch {
		case st.dtype == "F32" && st.Kind() == tensorKindFP32,
			st.dtype == "F16" && st.Kind() == tensorKindFP16,
			st.dtype == "U8":
			return io.CopyN(w, buffered, st.size)
		}
	}

	// Decode the source data into float32 values.
	var values []float32
	switch st.dtype {
	case "F32":
		values = make([]float32, st.size/4)
		if err = binary.Read(buffered, binary.LittleEndian, values); err != nil {
			return 0, err
		}
	case "F16":
		halves := make([]uint16, st.size/2)
		if err = binary.Read(buffered, binary.LittleEndian, halves); err != nil {
			return 0, err
		}

		values = make([]float32, len(halves))
		for i, bits := range halves {
			values[i] = float16.Frombits(bits).Float32()
		}
	case "BF16":
		raw := make([]uint8, st.size)
		if err = binary.Read(buffered, binary.LittleEndian, raw); err != nil {
			return 0, err
		}

		values = bfloat16.DecodeFloat32(raw)
	default:
		return 0, fmt.Errorf("unknown data type: %s", st.dtype)
	}

	if st.repacker != nil {
		if values, err = st.repacker(st.Name(), values, st.Shape()); err != nil {
			return 0, err
		}
	}

	// Encode the float32 values in the requested output kind.
	switch st.Kind() {
	case tensorKindFP32:
		return int64(len(values) * 4), binary.Write(w, binary.LittleEndian, values)
	case tensorKindFP16:
		halves := make([]uint16, len(values))
		for i, v := range values {
			halves[i] = float16.Fromfloat32(v).Bits()
		}

		return int64(len(halves) * 2), binary.Write(w, binary.LittleEndian, halves)
	case tensorKindBF16:
		encoded := bfloat16.EncodeFloat32(values)
		return int64(len(encoded)), binary.Write(w, binary.LittleEndian, encoded)
	default:
		return 0, fmt.Errorf("unknown storage type: %d", st.Kind())
	}
}
refactor convert 2024-06-01 11:00:49 +08:00			`package convert`

			`import (`
convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`"bufio"`
refactor convert 2024-06-01 11:00:49 +08:00			`"bytes"`
			`"encoding/binary"`
			`"encoding/json"`
throw an error when encountering unsupport tensor sizes (#6538) 2024-08-28 08:54:04 +08:00			`"errors"`
refactor convert 2024-06-01 11:00:49 +08:00			`"fmt"`
			`"io"`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`"io/fs"`
s#x/exp/maps#maps# (#11506) 2025-07-24 04:23:32 +08:00			`"maps"`
refactor convert 2024-06-01 11:00:49 +08:00			`"slices"`
convert gemma2 2024-06-29 04:27:05 +08:00			`"strings"`
refactor convert 2024-06-01 11:00:49 +08:00
			`"github.com/d4l3k/go-bfloat16"`
			`"github.com/x448/float16"`
			`)`

			`type safetensorMetadata struct {`
			Type string `json:"dtype"`
			Shape []uint64 `json:"shape"`
			Offsets []int64 `json:"data_offsets"`
			`}`

convert gemma2 2024-06-29 04:27:05 +08:00			`func parseSafetensors(fsys fs.FS, replacer *strings.Replacer, ps ...string) ([]Tensor, error) {`
refactor convert 2024-06-01 11:00:49 +08:00			`var ts []Tensor`
			`for _, p := range ps {`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`f, err := fsys.Open(p)`
refactor convert 2024-06-01 11:00:49 +08:00			`if err != nil {`
			`return nil, err`
			`}`
			`defer f.Close()`

			`var n int64`
			`if err := binary.Read(f, binary.LittleEndian, &n); err != nil {`
			`return nil, err`
			`}`

			`b := bytes.NewBuffer(make([]byte, 0, n))`
			`if _, err = io.CopyN(b, f, n); err != nil {`
			`return nil, err`
			`}`

			`var headers map[string]safetensorMetadata`
			`if err := json.NewDecoder(b).Decode(&headers); err != nil {`
			`return nil, err`
			`}`

s#x/exp/maps#maps# (#11506) 2025-07-24 04:23:32 +08:00			`keys := slices.Sorted(maps.Keys(headers))`
refactor convert 2024-06-01 11:00:49 +08:00
Fix gemma2 2b conversion (#6645) 2024-09-06 08:02:28 +08:00			`names := make(map[string]struct{}, len(keys))`

refactor convert 2024-06-01 11:00:49 +08:00			`for _, key := range keys {`
			`if value := headers[key]; value.Type != "" {`
throw an error when encountering unsupport tensor sizes (#6538) 2024-08-28 08:54:04 +08:00			`// bitsandbytes quantized models are unsupported`
			`if len(value.Shape) == 0 {`
			`return nil, errors.New("unsupported safetensors model")`
			`}`
Fix gemma2 2b conversion (#6645) 2024-09-06 08:02:28 +08:00			`ggufName := replacer.Replace(key)`
			`if _, ok := names[ggufName]; ok {`
			`return nil, fmt.Errorf("duplicate tensor name '%s' was found for this model", ggufName)`
			`}`
			`names[ggufName] = struct{}{}`
refactor convert 2024-06-01 11:00:49 +08:00			`ts = append(ts, safetensor{`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`fs: fsys,`
refactor convert 2024-06-01 11:00:49 +08:00			`path: p,`
			`dtype: value.Type,`
			`offset: safetensorsPad(n, value.Offsets[0]),`
			`size: safetensorsPad(n, value.Offsets[1]) - safetensorsPad(n, value.Offsets[0]),`
			`tensorBase: &tensorBase{`
Fix gemma2 2b conversion (#6645) 2024-09-06 08:02:28 +08:00			`name: ggufName,`
refactor convert 2024-06-01 11:00:49 +08:00			`shape: value.Shape,`
			`},`
			`})`
			`}`
			`}`
			`}`

			`return ts, nil`
			`}`

comments 2024-07-09 07:59:48 +08:00			`// safetensorsPad returns the padded size of the safetensors file given a length n and offset s`
Update convert/reader_safetensors.go Co-authored-by: Jeffrey Morgan <jmorganca@gmail.com> 2024-08-01 01:58:22 +08:00			`func safetensorsPad(n, offset int64) int64 {`
			`return 8 + n + offset`
refactor convert 2024-06-01 11:00:49 +08:00			`}`

			`type safetensor struct {`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`fs fs.FS`
refactor convert 2024-06-01 11:00:49 +08:00			`path string`
			`dtype string`
			`offset int64`
			`size int64`
			`*tensorBase`
			`}`

gpt-oss (#11672) * bf16 * tests * gpt-oss * enable gptoss for engine * rough estimate * convert to mxfp4 * handle safetensors U8 * clamp glu/linear * update tokenizer * MXFP4 support This implements the Open Compute Microscaling (MX) FP4 format as a tensor type with backend implementations focusing on mulmat and mulmatid on CPU, CUDA, and Metal. * Unit tests for MXFP4 support This exercises various operations and shapes on both CPU and GPU (if detected on the system) * cuda graph * unit test adjustments * cuda: optimize memory access Read 4 bytes at a time (8 elements) when performing mul_mat_vec_mxfp4 * mac: fix crash on old macos versions cblas_sgemm is only supported on v13.3 and up, however bf16 is only supported on v14+ so we were falling back to ggml-blas and crashing on bf16 tensors. Checking for the function being null seems to be the simplest way to condittionally avoid registering the backend. * server: Minimum context length for gptoss This model requires a minimum context length of 8192 to function effectively. Users can set higher values through all normal mechanisms but lower values will be silently reset. * ggml: Multiply by numParallel for gptoss sliding window When computing the graph size estimate, the context size is already multiplied by numParallel so estimates reflect that. However, since sliding window models use a smaller, fixed context size, they need to manually take numParallel into account. * gpt-oss integration includes harmony parser and thinking levels, etc. * fix sync * fix tests * fix lint --------- Co-authored-by: Daniel Hiltgen <daniel@ollama.com> Co-authored-by: Jesse Gross <jesse@ollama.com> Co-authored-by: Devon Rifkin <drifkin@drifkin.net> 2025-08-06 03:21:16 +08:00			`func (st safetensor) Kind() uint32 {`
			`kind := st.tensorBase.Kind()`
convert: convert bf16 vision weights to fp16 (#12324) This change moves back to converting bf16 vision weights to fp16, specifically if they start with the name "v." (such as v.blk.0.attn_k.weight). This fixes a bug where converted images are failing because they are trying to call `im2col` which doesn't have a bf16 kernel in ggml. 2025-09-18 08:43:17 +08:00			`if !strings.HasPrefix(st.name, "v.") && st.dtype == "BF16" && kind != tensorKindFP32 {`
gpt-oss (#11672) * bf16 * tests * gpt-oss * enable gptoss for engine * rough estimate * convert to mxfp4 * handle safetensors U8 * clamp glu/linear * update tokenizer * MXFP4 support This implements the Open Compute Microscaling (MX) FP4 format as a tensor type with backend implementations focusing on mulmat and mulmatid on CPU, CUDA, and Metal. * Unit tests for MXFP4 support This exercises various operations and shapes on both CPU and GPU (if detected on the system) * cuda graph * unit test adjustments * cuda: optimize memory access Read 4 bytes at a time (8 elements) when performing mul_mat_vec_mxfp4 * mac: fix crash on old macos versions cblas_sgemm is only supported on v13.3 and up, however bf16 is only supported on v14+ so we were falling back to ggml-blas and crashing on bf16 tensors. Checking for the function being null seems to be the simplest way to condittionally avoid registering the backend. * server: Minimum context length for gptoss This model requires a minimum context length of 8192 to function effectively. Users can set higher values through all normal mechanisms but lower values will be silently reset. * ggml: Multiply by numParallel for gptoss sliding window When computing the graph size estimate, the context size is already multiplied by numParallel so estimates reflect that. However, since sliding window models use a smaller, fixed context size, they need to manually take numParallel into account. * gpt-oss integration includes harmony parser and thinking levels, etc. * fix sync * fix tests * fix lint --------- Co-authored-by: Daniel Hiltgen <daniel@ollama.com> Co-authored-by: Jesse Gross <jesse@ollama.com> Co-authored-by: Devon Rifkin <drifkin@drifkin.net> 2025-08-06 03:21:16 +08:00			`kind = tensorKindBF16`
			`}`

			`return kind`
			`}`

llama4 2025-04-04 06:18:29 +08:00			`func (st safetensor) Clone() Tensor {`
			`return &safetensor{`
			`fs: st.fs,`
			`path: st.path,`
			`dtype: st.dtype,`
			`offset: st.offset,`
			`size: st.size,`
			`tensorBase: &tensorBase{`
			`name: st.name,`
			`repacker: st.repacker,`
			`shape: slices.Clone(st.shape),`
			`},`
			`}`
			`}`

refactor convert 2024-06-01 11:00:49 +08:00			`func (st safetensor) WriteTo(w io.Writer) (int64, error) {`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`f, err := st.fs.Open(st.path)`
refactor convert 2024-06-01 11:00:49 +08:00			`if err != nil {`
			`return 0, err`
			`}`
			`defer f.Close()`

convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`r, err := func() (io.Reader, error) {`
			`if readerAt, ok := f.(io.ReaderAt); ok {`
			`return io.NewSectionReader(readerAt, st.offset, st.size), nil`
			`} else if seeker, ok := f.(io.Seeker); ok {`
			`_, err := seeker.Seek(st.offset, io.SeekStart)`
			`return f, err`
			`} else {`
			`_, err := io.CopyN(io.Discard, f, st.offset)`
			`return f, err`
convert: only extract large files 2024-06-30 07:53:59 +08:00			`}`
convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`}()`
			`if err != nil {`
			`return 0, err`
			`}`

			`br := bufio.NewReaderSize(r, min(32<<10, int(st.size)))`
			`// special case when input and output are same type and the`
			`// tensor doesn't need repacking`
			`if (st.repacker == nil) &&`
			`((st.dtype == "F32" && st.Kind() == tensorKindFP32) \|\|`
			`(st.dtype == "F16" && st.Kind() == tensorKindFP16) \|\|`
			`(st.dtype == "U8")) {`
			`return io.CopyN(w, br, st.size)`
refactor convert 2024-06-01 11:00:49 +08:00			`}`

			`var f32s []float32`
			`switch st.dtype {`
			`case "F32":`
			`f32s = make([]float32, st.size/4)`
convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`if err = binary.Read(br, binary.LittleEndian, f32s); err != nil {`
refactor convert 2024-06-01 11:00:49 +08:00			`return 0, err`
			`}`
			`case "F16":`
			`u16s := make([]uint16, st.size/2)`
convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`if err = binary.Read(br, binary.LittleEndian, u16s); err != nil {`
refactor convert 2024-06-01 11:00:49 +08:00			`return 0, err`
			`}`

lint 2024-08-02 05:52:15 +08:00			`f32s = make([]float32, len(u16s))`
			`for i := range u16s {`
			`f32s[i] = float16.Frombits(u16s[i]).Float32()`
refactor convert 2024-06-01 11:00:49 +08:00			`}`

			`case "BF16":`
			`u8s := make([]uint8, st.size)`
convert: skip reading into memory when possible (#11507) if there's no transformation to the tensor and the input and output types match, copy directly into the writer. also read from a bufio with a 32K buffer 2025-08-15 06:03:57 +08:00			`if err = binary.Read(br, binary.LittleEndian, u8s); err != nil {`
refactor convert 2024-06-01 11:00:49 +08:00			`return 0, err`
			`}`

			`f32s = bfloat16.DecodeFloat32(u8s)`
			`default:`
			`return 0, fmt.Errorf("unknown data type: %s", st.dtype)`
			`}`

			`if st.repacker != nil {`
			`f32s, err = st.repacker(st.Name(), f32s, st.Shape())`
			`if err != nil {`
			`return 0, err`
			`}`
			`}`

			`switch st.Kind() {`
gpt-oss (#11672) * bf16 * tests * gpt-oss * enable gptoss for engine * rough estimate * convert to mxfp4 * handle safetensors U8 * clamp glu/linear * update tokenizer * MXFP4 support This implements the Open Compute Microscaling (MX) FP4 format as a tensor type with backend implementations focusing on mulmat and mulmatid on CPU, CUDA, and Metal. * Unit tests for MXFP4 support This exercises various operations and shapes on both CPU and GPU (if detected on the system) * cuda graph * unit test adjustments * cuda: optimize memory access Read 4 bytes at a time (8 elements) when performing mul_mat_vec_mxfp4 * mac: fix crash on old macos versions cblas_sgemm is only supported on v13.3 and up, however bf16 is only supported on v14+ so we were falling back to ggml-blas and crashing on bf16 tensors. Checking for the function being null seems to be the simplest way to condittionally avoid registering the backend. * server: Minimum context length for gptoss This model requires a minimum context length of 8192 to function effectively. Users can set higher values through all normal mechanisms but lower values will be silently reset. * ggml: Multiply by numParallel for gptoss sliding window When computing the graph size estimate, the context size is already multiplied by numParallel so estimates reflect that. However, since sliding window models use a smaller, fixed context size, they need to manually take numParallel into account. * gpt-oss integration includes harmony parser and thinking levels, etc. * fix sync * fix tests * fix lint --------- Co-authored-by: Daniel Hiltgen <daniel@ollama.com> Co-authored-by: Jesse Gross <jesse@ollama.com> Co-authored-by: Devon Rifkin <drifkin@drifkin.net> 2025-08-06 03:21:16 +08:00			`case tensorKindFP32:`
convert(gptoss): mxfp4 to ggml layout to avoid jit conversion (#12018) * convert: return bytes written * ggml flavor mxfp4 * simplify jit conversion * comment 2025-08-27 07:41:02 +08:00			`return int64(len(f32s) * 4), binary.Write(w, binary.LittleEndian, f32s)`
gpt-oss (#11672) * bf16 * tests * gpt-oss * enable gptoss for engine * rough estimate * convert to mxfp4 * handle safetensors U8 * clamp glu/linear * update tokenizer * MXFP4 support This implements the Open Compute Microscaling (MX) FP4 format as a tensor type with backend implementations focusing on mulmat and mulmatid on CPU, CUDA, and Metal. * Unit tests for MXFP4 support This exercises various operations and shapes on both CPU and GPU (if detected on the system) * cuda graph * unit test adjustments * cuda: optimize memory access Read 4 bytes at a time (8 elements) when performing mul_mat_vec_mxfp4 * mac: fix crash on old macos versions cblas_sgemm is only supported on v13.3 and up, however bf16 is only supported on v14+ so we were falling back to ggml-blas and crashing on bf16 tensors. Checking for the function being null seems to be the simplest way to condittionally avoid registering the backend. * server: Minimum context length for gptoss This model requires a minimum context length of 8192 to function effectively. Users can set higher values through all normal mechanisms but lower values will be silently reset. * ggml: Multiply by numParallel for gptoss sliding window When computing the graph size estimate, the context size is already multiplied by numParallel so estimates reflect that. However, since sliding window models use a smaller, fixed context size, they need to manually take numParallel into account. * gpt-oss integration includes harmony parser and thinking levels, etc. * fix sync * fix tests * fix lint --------- Co-authored-by: Daniel Hiltgen <daniel@ollama.com> Co-authored-by: Jesse Gross <jesse@ollama.com> Co-authored-by: Devon Rifkin <drifkin@drifkin.net> 2025-08-06 03:21:16 +08:00			`case tensorKindFP16:`
refactor convert 2024-06-01 11:00:49 +08:00			`f16s := make([]uint16, len(f32s))`
			`for i := range f32s {`
			`f16s[i] = float16.Fromfloat32(f32s[i]).Bits()`
			`}`

convert(gptoss): mxfp4 to ggml layout to avoid jit conversion (#12018) * convert: return bytes written * ggml flavor mxfp4 * simplify jit conversion * comment 2025-08-27 07:41:02 +08:00			`return int64(len(f16s) * 2), binary.Write(w, binary.LittleEndian, f16s)`
gpt-oss (#11672) * bf16 * tests * gpt-oss * enable gptoss for engine * rough estimate * convert to mxfp4 * handle safetensors U8 * clamp glu/linear * update tokenizer * MXFP4 support This implements the Open Compute Microscaling (MX) FP4 format as a tensor type with backend implementations focusing on mulmat and mulmatid on CPU, CUDA, and Metal. * Unit tests for MXFP4 support This exercises various operations and shapes on both CPU and GPU (if detected on the system) * cuda graph * unit test adjustments * cuda: optimize memory access Read 4 bytes at a time (8 elements) when performing mul_mat_vec_mxfp4 * mac: fix crash on old macos versions cblas_sgemm is only supported on v13.3 and up, however bf16 is only supported on v14+ so we were falling back to ggml-blas and crashing on bf16 tensors. Checking for the function being null seems to be the simplest way to condittionally avoid registering the backend. * server: Minimum context length for gptoss This model requires a minimum context length of 8192 to function effectively. Users can set higher values through all normal mechanisms but lower values will be silently reset. * ggml: Multiply by numParallel for gptoss sliding window When computing the graph size estimate, the context size is already multiplied by numParallel so estimates reflect that. However, since sliding window models use a smaller, fixed context size, they need to manually take numParallel into account. * gpt-oss integration includes harmony parser and thinking levels, etc. * fix sync * fix tests * fix lint --------- Co-authored-by: Daniel Hiltgen <daniel@ollama.com> Co-authored-by: Jesse Gross <jesse@ollama.com> Co-authored-by: Devon Rifkin <drifkin@drifkin.net> 2025-08-06 03:21:16 +08:00			`case tensorKindBF16:`
			`u8s := bfloat16.EncodeFloat32(f32s)`
convert(gptoss): mxfp4 to ggml layout to avoid jit conversion (#12018) * convert: return bytes written * ggml flavor mxfp4 * simplify jit conversion * comment 2025-08-27 07:41:02 +08:00			`return int64(len(u8s)), binary.Write(w, binary.LittleEndian, u8s)`
refactor convert 2024-06-01 11:00:49 +08:00			`default:`
			`return 0, fmt.Errorf("unknown storage type: %d", st.Kind())`
			`}`
			`}`