PoshCode Archive  Artifact [aad7c2aed3]

Artifact aad7c2aed3bd4ef4b95f0dab157d80eb65148dfa66972a30b3b38bd19a2f4549:

  • File Get-FileEncoding.ps1 — part of check-in [698c2bd3dd] at 2018-06-10 13:22:31 on branch trunk — Get-FileEncoding function determines encoding by looking at Byte Order Mark (BOM). (user: RyanFisher size: 1986)

# encoding: ascii
# api: powershell
# title: Get-FileEncoding
# description: Get-FileEncoding function determines encoding by looking at Byte Order Mark (BOM).
# version: 0.1
# type: script
# author: RyanFisher
# license: CC0
# function: Get-FileEncoding
# x-poshcode-id: 3227
# x-archived: 2012-02-13T11:11:44
# x-published: 2012-02-11T07:32:00
#
#
<#
.SYNOPSIS
Gets file encoding.
.DESCRIPTION
The Get-FileEncoding function determines encoding by looking at Byte Order Mark (BOM).
Based on port of C# code from http://www.west-wind.com/Weblog/posts/197245.aspx
.EXAMPLE
Get-ChildItem  *.ps1 | select FullName, @{n='Encoding';e={Get-FileEncoding $_.FullName}} | where {$_.Encoding -ne 'ASCII'}
This command gets ps1 files in current directory where encoding is not ASCII
.EXAMPLE
Get-ChildItem  *.ps1 | select FullName, @{n='Encoding';e={Get-FileEncoding $_.FullName}} | where {$_.Encoding -ne 'ASCII'} | foreach {(get-content $_.FullName) | set-content $_.FullName -Encoding ASCII}
Same as previous example but fixes encoding using set-content
#>
function Get-FileEncoding
{
    [CmdletBinding()] Param (
     [Parameter(Mandatory = $True, ValueFromPipelineByPropertyName = $True)] [string]$Path
    )

    [byte[]]$byte = get-content -Encoding byte -ReadCount 4 -TotalCount 4 -Path $Path

    if ($byte.count -ge 0)
    {
    	if ( $byte[0] -eq 0xef -and $byte[1] -eq 0xbb -and $byte[2] -eq 0xbf )
        	{ $encoding = 'UTF8' }  
    	elseif ($byte[0] -eq 0xfe -and $byte[1] -eq 0xff)
        	{ $encoding = 'BigEndianUnicode' }
    	elseif ($byte[0] -eq 0xff -and $byte[1] -eq 0xfe)
        	{ $encoding = 'Unicode' }
    	elseif ($byte[0] -eq 0 -and $byte[1] -eq 0 -and $byte[2] -eq 0xfe -and $byte[3] -eq 0xff)
        	{ $encoding = 'UTF32' }
    	elseif ($byte[0] -eq 0x2b -and $byte[1] -eq 0x2f -and $byte[2] -eq 0x76)
        	{ $encoding = 'UTF7'}
    	else
        	{ $encoding = 'ASCII' }
    	return $encoding
    }
}