From 04308dcaa1c5bd005f8519269b15d6d1da2a5fba Mon Sep 17 00:00:00 2001 From: Nick Craig-Wood Date: Wed, 30 Sep 2020 16:24:50 +0100 Subject: [PATCH] local: add --local-unicode-normalization (and remove --local-no-unicode-normalization) macOS stores files in NFD form and transferring them like this to some systems causes the Korean language to display incorrectly. This adds the flag --local-unicode-normalization to optionally normalize the file names to NFC. This also removes the (long deprecated) --local-no-unicode-normalization flag See: https://forum.rclone.org/t/support-for-korean-jaso-conversion/19435 --- backend/local/local.go | 29 +++++++++++++++++++---------- 1 file changed, 19 insertions(+), 10 deletions(-) diff --git a/backend/local/local.go b/backend/local/local.go index 476e3cc89..01fed30a3 100644 --- a/backend/local/local.go +++ b/backend/local/local.go @@ -27,6 +27,7 @@ import ( "github.com/rclone/rclone/lib/encoder" "github.com/rclone/rclone/lib/file" "github.com/rclone/rclone/lib/readers" + "golang.org/x/text/unicode/norm" ) // Constants @@ -86,12 +87,21 @@ So rclone now always reads the link Default: false, Advanced: true, }, { - Name: "no_unicode_normalization", - Help: `Don't apply unicode normalization to paths and filenames (Deprecated) + Name: "unicode_normalization", + Help: `Apply unicode NFC normalization to paths and filenames -This flag is deprecated now. Rclone no longer normalizes unicode file -names, but it compares them with unicode normalization in the sync -routine instead.`, +This flag can be used to normalize file names into unicode NFC form +that are read from the local filesystem. + +Rclone does not normally touch the encoding of file names it reads from +the file system. + +This can be useful when using macOS as it normally provides decomposed (NFD) +unicode which in some language (eg Korean) doesn't display properly on +some OSes. + +Note that rclone compares filenames with unicode normalization in the sync +routine so this flag shouldn't normally be used.`, Default: false, Advanced: true, }, { @@ -196,7 +206,7 @@ type Options struct { FollowSymlinks bool `config:"copy_links"` TranslateSymlinks bool `config:"links"` SkipSymlinks bool `config:"skip_links"` - NoUTFNorm bool `config:"no_unicode_normalization"` + UTFNorm bool `config:"unicode_normalization"` NoCheckUpdated bool `config:"no_check_updated"` NoUNC bool `config:"nounc"` OneFileSystem bool `config:"one_file_system"` @@ -255,10 +265,6 @@ func NewFs(ctx context.Context, name, root string, m configmap.Mapper) (fs.Fs, e return nil, errLinksAndCopyLinks } - if opt.NoUTFNorm { - fs.Errorf(nil, "The --local-no-unicode-normalization flag is deprecated and will be removed") - } - f := &Fs{ name: name, opt: *opt, @@ -521,6 +527,9 @@ func (f *Fs) List(ctx context.Context, dir string) (entries fs.DirEntries, err e } func (f *Fs) cleanRemote(dir, filename string) (remote string) { + if f.opt.UTFNorm { + filename = norm.NFC.String(filename) + } remote = path.Join(dir, f.opt.Enc.ToStandardName(filename)) if !utf8.ValidString(filename) {