1
0
mirror of https://github.com/fumiama/go-base16384.git synced 2026-06-05 00:32:52 +08:00

finish arm64 encode

This commit is contained in:
源文雨
2022-12-13 17:08:02 +08:00
parent d47127dc75
commit 5e0f486237
5 changed files with 277 additions and 3 deletions

View File

@@ -118,7 +118,7 @@ encsav:
ADDQ CX, DX
SHLQ $3, SI
MOVQ DX, ·sum+64(FP)
MOVQ SI, ·sum+72(FP)
MOVQ SI, ·n+72(FP)
encend:
RET

45
base14_arm64.go Normal file
View File

@@ -0,0 +1,45 @@
//go:build arm64
// +build arm64
package base14
import (
"encoding/binary"
"unsafe"
)
//go:noescape
//go:nosplit
func _encode(offset, outlen int, b, encd []byte) (sum uint64, valn uintptr)
//go:noescape
//go:nosplit
func _decode(offset, outlen int, b, decd []byte)
func encode(offset, outlen int, b, encd []byte) {
if len(b) == 7 {
b = append(b, 0)
}
sum, valn := _encode(offset, outlen, b, encd)
if offset == 0 {
return
}
n := valn - (uintptr)(*(*unsafe.Pointer)(unsafe.Pointer(&encd)))
println(sum, n)
var tmp [4]byte
binary.LittleEndian.PutUint32(tmp[:], uint32(sum))
copy(encd[n:], tmp[:])
encd[outlen-2] = '='
encd[outlen-1] = byte(offset)
}
func decode(offset, outlen int, b, decd []byte) {
/*
if offset != 0 && cap(b) == len(b) {
b = append(b, make([]byte, 8)...)
}
_decode(offset, outlen, b, decd)
*/
decodeGeneric(offset, outlen, b, decd)
}

123
base14_arm64.s Normal file
View File

@@ -0,0 +1,123 @@
//go:build arm64
// +build arm64
#include "textflag.h"
// func _encode(offset, outlen int, b, encd []byte) (sum uint64, &vals[n] uintptr)
TEXT ·_encode(SB), NOSPLIT, $0-81
MOVD ·offset+0(FP), R0
MOVD ·data+16(FP), R9
MOVD ·dlen+24(FP), R3
MOVD ·encd+40(FP), R5
SUBW $6, R3, R3
CMPW $0, R3
BLE enctil
MOVW $0x4e00, R11
SUB $8, R5, R14
SUB $4, R5, R13
MOVD $2, R8
MOVW $0, R10 // int32_t i = 0
MOVK $(0x4e00<<16), R11
enclop:
MOVW (R9), R4
ADDW $7, R10, R10
MOVW R8, R12
CMPW R3, R10
REVW R4, R4
ADD $7, R9, R9
LSRW $2, R4, R6
UBFX $4, R4, $14, R15
ANDW $0x3fff0000, R6, R6
UBFIZW $26, R4, $4, R7
ORRW R15, R6, R6
ADDW R11, R6, R6
REVW R6, R6
MOVW R6, (R14)(R8<<2)
MOVW -3(R9), R4
REVW R4, R4
LSRW $6, R4, R4
ANDW $0x3fffffc, R4, R4
ORRW R7, R4, R4
ANDW $0x3fff0000, R4, R6
UBFX $2, R4, $14, R4
ORRW R6, R4, R4
ADDW R11, R4, R4
REVW R4, R4
MOVW R4, (R13)(R8<<2)
ADDW $2, R8, R8
BLT enclop
encrem:
ANDSW $0xff, R0, R0
BEQ encret
MOVBU (R2)(R10.SXTW), R3
UXTW R12, R8
CMPW $1, R0
SXTW R10, R10
ADD R8<<2, R5, R7
UBFIZW $14, R3, $2, R4
ORRW R3>>2, R4, R3
BEQ encsum
ADD R10, R2, R9
CMPW $2, R0
MOVBU 1(R9), R6
LSLW $6, R6, R4
UBFIZW $20, R6, $2, R6
ANDW $0x3f00, R4, R4
ORRW R3, R4, R3
ORRW R3, R6, R3
BEQ encsum
MOVBU 2(R9), R4
CMPW $3, R0
LSLW $12, R4, R6
ANDW $0xf0000, R6, R6
ORRW R4<<28, R6, R4
ORRW R4, R3, R3
BEQ encsum
ADD $3, R10, R10
ADDW $1, R12, R12
CMPW $4, R0
ADD R12<<2, R5, R7
MOVBU (R2)(R10), R4
LSLW $20, R4, R4
ANDW $0xf000000, R4, R4
ORRW R3, R4, R3
ADDW $0x4e0000, R3, R3
ADDW $78, R3, R3
MOVW R3, (R5)(R8<<2)
MOVBU (R2)(R10), R3
UBFIZW $2, R3, $4, R3
BEQ encsum
MOVBU 4(R9), R4
CMPW $5, R0
UBFIZW $10, R4, $6, R2
ORRW R3, R2, R3
ORRW R4>>6, R3, R3
BEQ encsum
MOVBU 5(R9), R4
LSLW $2, R4, R2
UBFIZW $16, R4, $6, R4
ANDW $0x300, R2, R2
ORRW R4, R2, R2
ORRW R2, R3, R3
encsum:
ADDW $0x4e0000, R3, R3
ADDW $0x4e, R3, R3
MOVD R3, ·sum+64(FP)
MOVD R7, ·n+72(FP)
encret:
RET
enctil:
MOVW $0, R10
MOVW $0, R12
JMP encrem
// func _decode(offset, outlen int, b, decd []byte)
TEXT ·_decode(SB), NOSPLIT, $0-64

View File

@@ -1,5 +1,5 @@
//go:build !amd64
// +build !amd64
//go:build !amd64 && !arm64
// +build !amd64,!arm64
package base14

106
c/base1432.c Normal file
View File

@@ -0,0 +1,106 @@
#ifdef __cosmopolitan // always le
# define be16toh(x) bswap_16(x)
# define be32toh(x) bswap_32(x)
# define htobe16(x) bswap_16(x)
# define htobe32(x) bswap_32(x)
#else
#include <stdio.h>
#include <stdint.h>
#include <stdlib.h>
#ifdef __linux__
# include <endian.h>
#endif
#ifdef __FreeBSD__
# include <sys/endian.h>
#endif
#ifdef __NetBSD__
# include <sys/endian.h>
#endif
#ifdef __OpenBSD__
# include <sys/types.h>
# define be16toh(x) betoh16(x)
# define be32toh(x) betoh32(x)
#endif
#ifdef __MAC_10_0
# define be16toh(x) ntohs(x)
# define be32toh(x) ntohl(x)
# define htobe16(x) ntohs(x)
# define htobe32(x) htonl(x)
#endif
#ifdef _WIN32
#ifdef WORDS_BIGENDIAN
# define be16toh(x) (x)
# define be32toh(x) (x)
# define htobe16(x) (x)
# define htobe32(x) (x)
#else
# define be16toh(x) _byteswap_ushort(x)
# define be32toh(x) _byteswap_ulong(x)
# define htobe16(x) _byteswap_ushort(x)
# define htobe32(x) _byteswap_ulong(x)
#endif
#endif
#endif
int base16384_encode(int offset, int outlen, const char* data, int dlen, int dcap, char* buf, int blen, int bcap) {
uint32_t* vals = (uint32_t*)buf;
uint32_t n = 0;
int32_t i = 0;
for(; i <= dlen - 7; i += 7) {
register uint32_t sum = 0;
register uint32_t shift = htobe32(*(uint32_t*)(data+i));
sum |= (shift>>2) & 0x3fff0000;
sum |= (shift>>4) & 0x00003fff;
sum += 0x4e004e00;
vals[n++] = be32toh(sum);
shift <<= 26;
shift &= 0x3c000000;
sum = 0;
shift |= (htobe32(*(uint32_t*)(data+i+4))>>6)&0x03fffffc;
sum |= shift & 0x3fff0000;
shift >>= 2;
sum |= shift & 0x00003fff;
sum += 0x4e004e00;
vals[n++] = be32toh(sum);
}
uint8_t o = offset;
if(o--) {
register uint32_t sum = 0x0000003f & (data[i] >> 2);
sum |= ((uint32_t)data[i] << 14) & 0x0000c000;
if(o--) {
sum |= ((uint32_t)data[i + 1] << 6) & 0x00003f00;
sum |= ((uint32_t)data[i + 1] << 20) & 0x00300000;
if(o--) {
sum |= ((uint32_t)data[i + 2] << 12) & 0x000f0000;
sum |= ((uint32_t)data[i + 2] << 28) & 0xf0000000;
if(o--) {
sum |= ((uint32_t)data[i + 3] << 20) & 0x0f000000;
sum += 0x004e004e;
#ifdef WORDS_BIGENDIAN
vals[n++] = __builtin_bswap32(sum);
#else
vals[n++] = sum;
#endif
sum = (((uint32_t)data[i + 3] << 2)) & 0x0000003c;
if(o--) {
sum |= (((uint32_t)data[i + 4] >> 6)) & 0x00000003;
sum |= ((uint32_t)data[i + 4] << 10) & 0x0000fc00;
if(o--) {
sum |= ((uint32_t)data[i + 5] << 2) & 0x00000300;
sum |= ((uint32_t)data[i + 5] << 16) & 0x003f0000;
}
}
}
}
}
sum += 0x004e004e;
#ifdef WORDS_BIGENDIAN
vals[n] = __builtin_bswap32(sum);
#else
vals[n] = sum;
#endif
buf[outlen - 2] = '=';
buf[outlen - 1] = offset;
}
return outlen;
}