The `ToUTF8*` functions were stripping the BOM, but a BOM is actually valid in UTF-8, so the stripping must be optional depending on the use case. This change does the following: - Add an options struct to all `ToUTF8*` functions, which by default strips the BOM to preserve existing behaviour - Remove the `ToUTF8` function, as it was dead code - Rename `ToUTF8WithErr` to `ToUTF8` - Preserve the BOM in Monaco Editor - Remove an unnecessary newline in the textarea value. Browsers seem to ignore it, but it's better not to rely on this behaviour. Fixes: https://github.com/go-gitea/gitea/issues/28743 Related: https://github.com/go-gitea/gitea/issues/6716, which seems to have once introduced a mechanism that strips and re-adds the BOM, but from what I can tell, this mechanism was removed at some point after that PR.
		
			
				
	
	
		
			78 lines
		
	
	
		
			1.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			78 lines
		
	
	
		
			1.9 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2022 The Gitea Authors. All rights reserved.
 | |
| // SPDX-License-Identifier: MIT
 | |
| 
 | |
| package repo
 | |
| 
 | |
| import (
 | |
| 	"bytes"
 | |
| 	"io"
 | |
| 	"net/http"
 | |
| 	"path"
 | |
| 
 | |
| 	"code.gitea.io/gitea/modules/charset"
 | |
| 	"code.gitea.io/gitea/modules/context"
 | |
| 	"code.gitea.io/gitea/modules/git"
 | |
| 	"code.gitea.io/gitea/modules/markup"
 | |
| 	"code.gitea.io/gitea/modules/typesniffer"
 | |
| 	"code.gitea.io/gitea/modules/util"
 | |
| )
 | |
| 
 | |
| // RenderFile renders a file by repos path
 | |
| func RenderFile(ctx *context.Context) {
 | |
| 	blob, err := ctx.Repo.Commit.GetBlobByPath(ctx.Repo.TreePath)
 | |
| 	if err != nil {
 | |
| 		if git.IsErrNotExist(err) {
 | |
| 			ctx.NotFound("GetBlobByPath", err)
 | |
| 		} else {
 | |
| 			ctx.ServerError("GetBlobByPath", err)
 | |
| 		}
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	dataRc, err := blob.DataAsync()
 | |
| 	if err != nil {
 | |
| 		ctx.ServerError("DataAsync", err)
 | |
| 		return
 | |
| 	}
 | |
| 	defer dataRc.Close()
 | |
| 
 | |
| 	buf := make([]byte, 1024)
 | |
| 	n, _ := util.ReadAtMost(dataRc, buf)
 | |
| 	buf = buf[:n]
 | |
| 
 | |
| 	st := typesniffer.DetectContentType(buf)
 | |
| 	isTextFile := st.IsText()
 | |
| 
 | |
| 	rd := charset.ToUTF8WithFallbackReader(io.MultiReader(bytes.NewReader(buf), dataRc), charset.ConvertOpts{})
 | |
| 
 | |
| 	if markupType := markup.Type(blob.Name()); markupType == "" {
 | |
| 		if isTextFile {
 | |
| 			_, err = io.Copy(ctx.Resp, rd)
 | |
| 			if err != nil {
 | |
| 				ctx.ServerError("Copy", err)
 | |
| 			}
 | |
| 			return
 | |
| 		}
 | |
| 		ctx.Error(http.StatusInternalServerError, "Unsupported file type render")
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	ctx.Resp.Header().Add("Content-Security-Policy", "frame-src 'self'; sandbox allow-scripts")
 | |
| 	err = markup.Render(&markup.RenderContext{
 | |
| 		Ctx:          ctx,
 | |
| 		RelativePath: ctx.Repo.TreePath,
 | |
| 		Links: markup.Links{
 | |
| 			Base:       ctx.Repo.RepoLink,
 | |
| 			BranchPath: ctx.Repo.BranchNameSubURL(),
 | |
| 			TreePath:   path.Dir(ctx.Repo.TreePath),
 | |
| 		},
 | |
| 		Metas:            ctx.Repo.Repository.ComposeDocumentMetas(ctx),
 | |
| 		GitRepo:          ctx.Repo.GitRepo,
 | |
| 		InStandalonePage: true,
 | |
| 	}, rd, ctx.Resp)
 | |
| 	if err != nil {
 | |
| 		ctx.ServerError("Render", err)
 | |
| 		return
 | |
| 	}
 | |
| }
 |