## What
TL;DR: AI use-cases such as embeddings, text classification, named entity recognition, fine-tuning, and more!
The goal of this library is to provide an easy, scalable, and hassle-free way to run inference and training of transformer pipelines, such as Hugging Face 🤗 transformers pipelines, in golang applications. It is built on the following principles:
1. Hugging Face compatibility: models trained and tested with the python Hugging Face transformers library can be exported to ONNX and used with the hugot pipelines to obtain identical predictions as in the python version.
We support inference on CPU and on all accelerators supported by ONNX Runtime/OpenXLA. Note, however, that currently only CPU inference and GPU inference on Nvidia GPUs via CUDA are tested (see below).
Hugot loads and saves models in the ONNX format.
## Why
Developing and fine-tuning transformer models with the Hugging Face python library is great, but if your production stack is golang-based, reliably deploying and scaling the resulting pytorch models can be challenging. This library aims to let you lift and shift your python models and use the same Hugging Face pipelines you use for development for inference in a go application.
## For whom
For the golang developer or ML engineer who wants to run or fine-tune transformer pipelines on their own hardware and tightly coupled with their own application, without having to deal with writing their own inference or training code.
## By whom
Hugot is brought to you by the friendly folks at [Knights Analytics](https://knightsanalytics.com), who use Hugot in production to automate AI-powered data curation.
## Implemented pipelines
Training is currently supported only for the **FeatureExtractionPipeline**. Each line of the training dataset pairs two sentences with a similarity score:

```json
{"sentence1": "The quick brown fox jumps over the lazy dog", "sentence2": "A quick brown cow jumps over a lazy caterpillar", "score": 0.5}
```
See the [example](./testData/semanticSimilarityTest.jsonl) for a sample dataset.
The score is assumed to be a float between 0 and 1 that encodes the semantic similarity between the sentences, and by default a cosine similarity loss is used (see [sentence transformers](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss)). However, you can also specify a different loss function from `goMLX` using the `XLATrainingOptions` field in the `TrainingConfig` struct. See [the training tests](./hugot_training_test.go) for examples on how to train or fine-tune feature extraction pipelines.