feat: Inital commit
This commit is contained in:
+153
@@ -0,0 +1,153 @@
|
||||
/*
|
||||
* Copyright 2020 National Library of Norway.
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
package url
|
||||
|
||||
import (
|
||||
"unicode"
|
||||
|
||||
"github.com/bits-and-blooms/bitset"
|
||||
)
|
||||
|
||||
type PercentEncodeSet struct {
|
||||
bs *bitset.BitSet
|
||||
allBelow int32
|
||||
}
|
||||
|
||||
func NewPercentEncodeSet(allBelow int32, bytes ...uint) *PercentEncodeSet {
|
||||
p := &PercentEncodeSet{allBelow: allBelow, bs: bitset.New(0x7f)}
|
||||
for _, b := range bytes {
|
||||
p.bs.Set(b)
|
||||
}
|
||||
return p
|
||||
}
|
||||
|
||||
func (p *PercentEncodeSet) Set(bytes ...uint) *PercentEncodeSet {
|
||||
r := &PercentEncodeSet{
|
||||
allBelow: p.allBelow,
|
||||
bs: p.bs.Clone(),
|
||||
}
|
||||
for _, b := range bytes {
|
||||
r.bs.Set(b)
|
||||
}
|
||||
return r
|
||||
}
|
||||
|
||||
func (p *PercentEncodeSet) Clear(bytes ...uint) *PercentEncodeSet {
|
||||
r := &PercentEncodeSet{
|
||||
allBelow: p.allBelow,
|
||||
bs: p.bs.Clone(),
|
||||
}
|
||||
for _, b := range bytes {
|
||||
r.bs.Clear(b)
|
||||
}
|
||||
return r
|
||||
}
|
||||
|
||||
func (p *PercentEncodeSet) RuneShouldBeEncoded(r rune) bool {
|
||||
if r < p.allBelow || r > 0x007E || p.bs.Test(uint(r)) {
|
||||
return true
|
||||
}
|
||||
return false
|
||||
}
|
||||
|
||||
func (p *PercentEncodeSet) ByteShouldBeEncoded(b byte) bool {
|
||||
if int32(b) < p.allBelow || b > 0x007E || p.bs.Test(uint(b)) {
|
||||
return true
|
||||
}
|
||||
return false
|
||||
}
|
||||
|
||||
func (p *PercentEncodeSet) RuneNotInSet(r rune) bool {
|
||||
if r < p.allBelow || p.bs.Test(uint(r)) {
|
||||
return false
|
||||
}
|
||||
return true
|
||||
}
|
||||
|
||||
func isURLCodePoint(r rune) bool {
|
||||
if ASCIIAlphanumeric.Test(uint(r)) {
|
||||
return true
|
||||
}
|
||||
if someURLCodePoints.Test(uint(r)) {
|
||||
return true
|
||||
}
|
||||
if r >= 0xa0 && r <= 0x10fffd {
|
||||
if unicode.Is(unicode.Noncharacter_Code_Point, r) {
|
||||
return false
|
||||
}
|
||||
if unicode.Is(unicode.Cs, r) {
|
||||
return false
|
||||
}
|
||||
return true
|
||||
}
|
||||
return false
|
||||
}
|
||||
|
||||
var ASCIITabOrNewline = bitset.New(0x0d).Set(0x09).Set(0x0a).Set(0x0d)
|
||||
var ASCIIAlpha = bitset.New(0x7a)
|
||||
var ASCIIDigit = bitset.New(0x39)
|
||||
var ASCIIHexDigit = bitset.New(0x66)
|
||||
var ASCIIAlphanumeric = bitset.New(0x7a)
|
||||
var C0control = bitset.New(0x1f)
|
||||
var C0controlOrSpace = bitset.New(0x20).Set(0x20)
|
||||
var ForbiddenHostCodePoint = bitset.New(0x7c).Set(0x00).Set(0x09).Set(0x0a).Set(0x0d).Set(0x20).
|
||||
Set(0x23).Set(0x2f).Set(0x3a).Set(0x3c).Set(0x3e).Set(0x3f).Set(0x40).Set(0x5b).
|
||||
Set(0x5c).Set(0x5d).Set(0x5e).Set(0x7c)
|
||||
var ForbiddenDomainCodePoint = ForbiddenHostCodePoint.Clone().Set(0x25).Set(0x7f)
|
||||
var someURLCodePoints = bitset.New(0x7e).Set(0x24).Set(0x26).Set(0x27).Set(0x28).Set(0x29).
|
||||
Set(0x2a).Set(0x2b).Set(0x2c).Set(0x2d).Set(0x2e).Set(0x2f).Set(0x3a).Set(0x3b).Set(0x3d).
|
||||
Set(0x3f).Set(0x40).Set(0x5f).Set(0x7e)
|
||||
|
||||
var C0PercentEncodeSet = NewPercentEncodeSet(0x20)
|
||||
var C0OrSpacePercentEncodeSet = NewPercentEncodeSet(0x21)
|
||||
var FragmentPercentEncodeSet = C0OrSpacePercentEncodeSet.Set(0x22, 0x3c, 0x3e, 0x60)
|
||||
var QueryPercentEncodeSet = C0OrSpacePercentEncodeSet.Set(0x22, 0x23, 0x3C, 0x3E)
|
||||
var SpecialQueryPercentEncodeSet = QueryPercentEncodeSet.Set(0x27)
|
||||
var PathPercentEncodeSet = QueryPercentEncodeSet.Set(0x3f, 0x60, 0x7b, 0x7d)
|
||||
var UserInfoPercentEncodeSet = PathPercentEncodeSet.Set(0x2f, 0x3a, 0x3b, 0x3d, 0x40, 0x5b, 0x5c, 0x5d, 0x5e, 0x7c)
|
||||
var HostPercentEncodeSet = C0OrSpacePercentEncodeSet.Set(0x23)
|
||||
|
||||
func init() {
|
||||
for i := 'a'; i <= 'z'; i++ {
|
||||
ASCIIAlpha.Set(uint(i))
|
||||
}
|
||||
for i := 'A'; i <= 'Z'; i++ {
|
||||
ASCIIAlpha.Set(uint(i))
|
||||
}
|
||||
|
||||
for i := '0'; i <= '9'; i++ {
|
||||
ASCIIDigit.Set(uint(i))
|
||||
}
|
||||
|
||||
ASCIIAlphanumeric.InPlaceUnion(ASCIIAlpha)
|
||||
ASCIIAlphanumeric.InPlaceUnion(ASCIIDigit)
|
||||
|
||||
ASCIIHexDigit.InPlaceUnion(ASCIIDigit)
|
||||
for i := 'A'; i <= 'F'; i++ {
|
||||
ASCIIHexDigit.Set(uint(i))
|
||||
}
|
||||
for i := 'a'; i <= 'f'; i++ {
|
||||
ASCIIHexDigit.Set(uint(i))
|
||||
}
|
||||
|
||||
// Add C0 control characters
|
||||
for i := 0x00; i <= 0x1f; i++ {
|
||||
C0control.Set(uint(i))
|
||||
C0controlOrSpace.Set(uint(i))
|
||||
ForbiddenDomainCodePoint.Set(uint(i))
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user