Public/ConvertTo-Token.ps1
function ConvertTo-Token { [CmdletBinding(DefaultParameterSetName = 'encoding')] [OutputType([int[]])] param ( [Parameter(Mandatory, Position = 0, ValueFromPipeline)] [AllowEmptyString()] [string]$Text, [Parameter(Mandatory, Position = 1, ParameterSetName = 'model')] [string][LowerCaseTransformation()]$Model, [Parameter(Mandatory = $false, Position = 1, ParameterSetName = 'encoding')] [ValidateSet('cl100k_base', 'o200k_base')] [string]$Encoding = 'cl100k_base' ) begin { if ($PSCmdlet.ParameterSetName -eq 'Model') { if ([string]::IsNullOrWhiteSpace($Model)) { Write-Error -Exception ([System.ArgumentException]::new('The model name not specifed properly.')) return } # Convert model name to encoding name $Encoding = Convert-ModelToEncoding -Model $Model if (-not $Encoding) { Write-Error -Exception ([System.ArgumentException]::new('The model name not specifed properly.')) return } } $Encoder = switch ($Encoding) { 'cl100k_base' { [PSOpenAI.TokenizerLib.Cl100kBaseTokenizer]::Encode } 'o200k_base' { [PSOpenAI.TokenizerLib.O200kBaseTokenizer]::Encode } } } process { try { , $Encoder.Invoke($Text).ToArray() } catch { Write-Error -Exception $_.Exception } } end {} } |