Skip to content

Commit 79d5d57

Browse files
committed
fix(lint): auto-fix comment periods with godot tool
Run godot -w to automatically add missing periods to comments
1 parent 837c0aa commit 79d5d57

File tree

15 files changed

+49
-49
lines changed

15 files changed

+49
-49
lines changed

llama3/cmd/llama3/decode.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,11 @@ import (
1212
)
1313

1414
var (
15-
// Decode command flags
15+
// Decode command flags.
1616
decSkipSpecial bool
1717
)
1818

19-
// newDecodeCmd creates the decode subcommand
19+
// newDecodeCmd creates the decode subcommand.
2020
func newDecodeCmd() *cobra.Command {
2121
cmd := &cobra.Command{
2222
Use: "decode [token_ids...]",

llama3/cmd/llama3/encode.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,13 +12,13 @@ import (
1212
)
1313

1414
var (
15-
// Encode command flags
15+
// Encode command flags.
1616
encAddBOS bool
1717
encAddEOS bool
1818
encOutput string
1919
)
2020

21-
// newEncodeCmd creates the encode subcommand
21+
// newEncodeCmd creates the encode subcommand.
2222
func newEncodeCmd() *cobra.Command {
2323
cmd := &cobra.Command{
2424
Use: "encode [text]",

llama3/cmd/llama3/info.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ import (
77
"github.com/spf13/cobra"
88
)
99

10-
// newInfoCmd creates the info subcommand
10+
// newInfoCmd creates the info subcommand.
1111
func newInfoCmd() *cobra.Command {
1212
cmd := &cobra.Command{
1313
Use: "info",

llama3/cmd/llama3/stream.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -9,15 +9,15 @@ import (
99
)
1010

1111
var (
12-
// Stream command flags
12+
// Stream command flags.
1313
streamBufferSize int
1414
streamMaxBuffer int
1515
streamAddBOS bool
1616
streamAddEOS bool
1717
streamOutput string
1818
)
1919

20-
// newStreamCmd creates the stream subcommand
20+
// newStreamCmd creates the stream subcommand.
2121
func newStreamCmd() *cobra.Command {
2222
cmd := &cobra.Command{
2323
Use: "stream",

llama3/comparison_test.go

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -11,19 +11,19 @@ import (
1111
"testing"
1212
)
1313

14-
// ComparisonTestCase represents a test case for comparing Go and JS implementations
14+
// ComparisonTestCase represents a test case for comparing Go and JS implementations.
1515
type ComparisonTestCase struct {
1616
Input string `json:"input"`
1717
Expected []int `json:"expected"`
1818
}
1919

20-
// toJSON converts a value to JSON string
20+
// toJSON converts a value to JSON string.
2121
func toJSON(v interface{}) string {
2222
b, _ := json.Marshal(v)
2323
return string(b)
2424
}
2525

26-
// generateTestVectors creates a JavaScript file to generate test vectors
26+
// generateTestVectors creates a JavaScript file to generate test vectors.
2727
func generateTestVectors(testCases []string) ([]ComparisonTestCase, error) {
2828
// Create temporary JS file
2929
tmpDir := os.TempDir()
@@ -62,7 +62,7 @@ console.log(JSON.stringify(results, null, 2));
6262
return results, nil
6363
}
6464

65-
// TestComparisonWithJS compares Go implementation with JavaScript implementation
65+
// TestComparisonWithJS compares Go implementation with JavaScript implementation.
6666
func TestComparisonWithJS(t *testing.T) {
6767
tokenizer, err := New()
6868
if err != nil || tokenizer.VocabSize() == 0 {
@@ -208,7 +208,7 @@ func TestComparisonWithJS(t *testing.T) {
208208
}
209209
}
210210

211-
// TestComparisonFromFile tests using test vectors from a file
211+
// TestComparisonFromFile tests using test vectors from a file.
212212
func TestComparisonFromFile(t *testing.T) {
213213
tokenizer, err := New()
214214
if err != nil || tokenizer.VocabSize() == 0 {
@@ -270,7 +270,7 @@ func TestComparisonFromFile(t *testing.T) {
270270
}
271271
}
272272

273-
// generateTestVectorFile creates a file with test vectors for future use
273+
// generateTestVectorFile creates a file with test vectors for future use.
274274
func generateTestVectorFile(filename string, count int) error {
275275
// Generate diverse test inputs
276276
var inputs []string

llama3/compatibility_test.go

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ import (
1212
testutils "github.com/agentstation/tokenizer/llama3/internal/testing"
1313
)
1414

15-
// TestCompatibility runs comprehensive compatibility tests with 476 test cases
15+
// TestCompatibility runs comprehensive compatibility tests with 476 test cases.
1616
func TestCompatibility(t *testing.T) {
1717
tokenizer, err := New()
1818
if err != nil || tokenizer.VocabSize() == 0 {
@@ -96,7 +96,7 @@ func TestCompatibility(t *testing.T) {
9696
float64(totalPassed)*100/float64(totalPassed+totalFailed))
9797
}
9898

99-
// getJSTokenization gets tokenization results from JavaScript implementation
99+
// getJSTokenization gets tokenization results from JavaScript implementation.
100100
func getJSTokenization(inputs []string, jsPath string) ([][]int, error) {
101101
// Create temporary JS file
102102
tmpDir := os.TempDir()
@@ -134,7 +134,7 @@ console.log(JSON.stringify(results));
134134
return results, nil
135135
}
136136

137-
// compareTokens compares two token arrays
137+
// compareTokens compares two token arrays.
138138
func compareTokens(a, b []int) bool {
139139
if len(a) != len(b) {
140140
return false
@@ -147,7 +147,7 @@ func compareTokens(a, b []int) bool {
147147
return true
148148
}
149149

150-
// TestTokenizationProperties tests properties that should hold for all inputs
150+
// TestTokenizationProperties tests properties that should hold for all inputs.
151151
func TestTokenizationProperties(t *testing.T) {
152152
tokenizer, err := New()
153153
if err != nil || tokenizer.VocabSize() == 0 {
@@ -185,7 +185,7 @@ func TestTokenizationProperties(t *testing.T) {
185185
}
186186
}
187187

188-
// BenchmarkCases benchmarks various categories of inputs
188+
// BenchmarkCases benchmarks various categories of inputs.
189189
func BenchmarkCases(b *testing.B) {
190190
tokenizer, err := New()
191191
if err != nil || tokenizer.VocabSize() == 0 {

llama3/errors.go

Lines changed: 12 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -5,22 +5,22 @@ import (
55
"fmt"
66
)
77

8-
// Common errors
8+
// Common errors.
99
var (
10-
// ErrDataNotFound indicates that the tokenizer data files could not be found
10+
// ErrDataNotFound indicates that the tokenizer data files could not be found.
1111
ErrDataNotFound = errors.New("tokenizer data not found")
1212

13-
// ErrInvalidToken indicates an invalid token was provided
13+
// ErrInvalidToken indicates an invalid token was provided.
1414
ErrInvalidToken = errors.New("invalid token")
1515

16-
// ErrTokenNotFound indicates a token was not found in the vocabulary
16+
// ErrTokenNotFound indicates a token was not found in the vocabulary.
1717
ErrTokenNotFound = errors.New("token not found")
1818

19-
// ErrInvalidTokenID indicates an invalid token ID was provided
19+
// ErrInvalidTokenID indicates an invalid token ID was provided.
2020
ErrInvalidTokenID = errors.New("invalid token ID")
2121
)
2222

23-
// DataError represents an error related to tokenizer data loading or processing
23+
// DataError represents an error related to tokenizer data loading or processing.
2424
type DataError struct {
2525
Op string // Operation that failed
2626
Path string // File path if applicable
@@ -38,7 +38,7 @@ func (e *DataError) Unwrap() error {
3838
return e.Err
3939
}
4040

41-
// TokenError represents an error related to token operations
41+
// TokenError represents an error related to token operations.
4242
type TokenError struct {
4343
Token string // The token that caused the error
4444
TokenID int // The token ID if applicable
@@ -60,7 +60,7 @@ func (e *TokenError) Unwrap() error {
6060
return e.Err
6161
}
6262

63-
// ConfigError represents an error in tokenizer configuration
63+
// ConfigError represents an error in tokenizer configuration.
6464
type ConfigError struct {
6565
Field string // Configuration field that has an error
6666
Value any // The invalid value
@@ -77,22 +77,22 @@ func (e *ConfigError) Unwrap() error {
7777

7878
// Helper functions for creating errors
7979

80-
// NewDataError creates a new DataError
80+
// NewDataError creates a new DataError.
8181
func NewDataError(op, path string, err error) error {
8282
return &DataError{Op: op, Path: path, Err: err}
8383
}
8484

85-
// NewTokenError creates a new TokenError
85+
// NewTokenError creates a new TokenError.
8686
func NewTokenError(op, token string, err error) error {
8787
return &TokenError{Op: op, Token: token, Err: err}
8888
}
8989

90-
// NewTokenIDError creates a new TokenError with a token ID
90+
// NewTokenIDError creates a new TokenError with a token ID.
9191
func NewTokenIDError(op string, tokenID int, err error) error {
9292
return &TokenError{Op: op, TokenID: tokenID, Err: err}
9393
}
9494

95-
// NewConfigError creates a new ConfigError
95+
// NewConfigError creates a new ConfigError.
9696
func NewConfigError(field string, value any, err error) error {
9797
return &ConfigError{Field: field, Value: value, Err: err}
9898
}

llama3/internal/pretokenizer/state_machine_test.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1070,7 +1070,7 @@ func TestCharacterClassification(t *testing.T) {
10701070
})
10711071
}
10721072

1073-
// Benchmark tests to ensure performance hasn't regressed
1073+
// Benchmark tests to ensure performance hasn't regressed.
10741074
func BenchmarkTokenizeLongText(b *testing.B) {
10751075
// Create a realistic long text
10761076
parts := []string{
@@ -1121,7 +1121,7 @@ func BenchmarkTokenizeWhitespaceHeavyTable(b *testing.B) {
11211121
}
11221122
}
11231123

1124-
// TestStateMachineJavaScriptCompatibility tests cases from JavaScript output
1124+
// TestStateMachineJavaScriptCompatibility tests cases from JavaScript output.
11251125
func TestStateMachineJavaScriptCompatibility(t *testing.T) {
11261126
testCases := []struct {
11271127
input string

llama3/internal/tokens/special.go

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,10 +7,10 @@ import (
77
)
88

99
var (
10-
// SpecialTokenRegex matches Llama 3 special tokens
10+
// SpecialTokenRegex matches Llama 3 special tokens.
1111
SpecialTokenRegex = regexp.MustCompile(`<\|(?:begin_of_text|end_of_text|start_header_id|end_header_id|eot_id|eom_id|python_tag|finetune_right_pad_id|reserved_special_token_(?:[0-9]|[1-9][0-9]|1[0-9][0-9]|2[0-3][0-9]|24[0-7]))\|>`)
1212

13-
// OptimisticSpecialTokenRegex matches any pattern that looks like a special token
13+
// OptimisticSpecialTokenRegex matches any pattern that looks like a special token.
1414
OptimisticSpecialTokenRegex = regexp.MustCompile(`<\|[a-zA-Z0-9_]+\|>`)
1515
)
1616

llama3/internal/vocabulary/decoder.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ import (
77
)
88

99
const (
10-
// bitsPerMergeID is the number of bits used to encode each merge ID
10+
// bitsPerMergeID is the number of bits used to encode each merge ID.
1111
bitsPerMergeID = 17
1212
)
1313

0 commit comments

Comments (0)